// Include guard for this header: the contents below are skipped if the macro is
// already defined. NOTE(review): the matching #endif is not visible in this
// excerpt and is presumably at the end of the file - confirm.
#ifndef CUFFTDX_FFT_625_FP64_FWD_PTX_HPP
#define CUFFTDX_FFT_625_FP64_FWD_PTX_HPP



template<> __forceinline__ __device__ void cufftdx_private_function<540, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<11>;
.reg .f64 fd<1429>;
.reg .b64 rd<7>;
mov.u32 r1, %tid.y;
mov.u32 r2, %50;
mad.lo.s32 r3, r1, 5000, r2;
add.f64 fd101, %65, %105;
add.f64 fd102, %52, fd101;
add.f64 fd103, %78, %92;
add.f64 fd104, fd103, fd102;
add.f64 fd105, %67, %107;
add.f64 fd106, %53, fd105;
add.f64 fd107, %80, %93;
add.f64 fd108, fd107, fd106;
fma.rn.f64 fd109, fd101, 0d3FD3C6EF372FE950, %52;
mul.f64 fd110, fd103, 0d3FE9E3779B97F4A8;
sub.f64 fd111, fd109, fd110;
sub.f64 fd112, %67, %107;
mul.f64 fd113, fd112, 0d3FEE6F0E134454FF;
sub.f64 fd114, %80, %93;
mul.f64 fd115, fd114, 0dBFE2CF2304755A5E;
sub.f64 fd116, fd115, fd113;
sub.f64 fd117, fd111, fd116;
add.f64 fd118, fd116, fd111;
mul.f64 fd119, fd101, 0d3FE9E3779B97F4A8;
sub.f64 fd120, %52, fd119;
fma.rn.f64 fd121, fd103, 0d3FD3C6EF372FE950, fd120;
mul.f64 fd122, fd112, 0d3FE2CF2304755A5E;
mul.f64 fd123, fd114, 0d3FEE6F0E134454FF;
sub.f64 fd124, fd123, fd122;
sub.f64 fd125, fd121, fd124;
add.f64 fd126, fd124, fd121;
fma.rn.f64 fd127, fd105, 0d3FD3C6EF372FE950, %53;
mul.f64 fd128, fd107, 0d3FE9E3779B97F4A8;
sub.f64 fd129, fd127, fd128;
sub.f64 fd130, %65, %105;
mul.f64 fd131, fd130, 0d3FEE6F0E134454FF;
sub.f64 fd132, %78, %92;
mul.f64 fd133, fd132, 0dBFE2CF2304755A5E;
sub.f64 fd134, fd133, fd131;
add.f64 fd135, fd134, fd129;
sub.f64 fd136, fd129, fd134;
mul.f64 fd137, fd105, 0d3FE9E3779B97F4A8;
sub.f64 fd138, %53, fd137;
fma.rn.f64 fd139, fd107, 0d3FD3C6EF372FE950, fd138;
mul.f64 fd140, fd130, 0d3FE2CF2304755A5E;
mul.f64 fd141, fd132, 0d3FEE6F0E134454FF;
sub.f64 fd142, fd141, fd140;
add.f64 fd143, fd142, fd139;
sub.f64 fd144, fd139, fd142;
add.f64 fd145, %68, %108;
add.f64 fd146, %54, fd145;
add.f64 fd147, %81, %94;
add.f64 fd148, fd147, fd146;
add.f64 fd149, %69, %109;
add.f64 fd150, %56, fd149;
add.f64 fd151, %83, %96;
add.f64 fd152, fd151, fd150;
fma.rn.f64 fd153, fd145, 0d3FD3C6EF372FE950, %54;
mul.f64 fd154, fd147, 0d3FE9E3779B97F4A8;
sub.f64 fd155, fd153, fd154;
sub.f64 fd156, %69, %109;
mul.f64 fd157, fd156, 0d3FEE6F0E134454FF;
sub.f64 fd158, %83, %96;
mul.f64 fd159, fd158, 0dBFE2CF2304755A5E;
sub.f64 fd160, fd159, fd157;
sub.f64 fd161, fd155, fd160;
add.f64 fd162, fd160, fd155;
mul.f64 fd163, fd145, 0d3FE9E3779B97F4A8;
sub.f64 fd164, %54, fd163;
fma.rn.f64 fd165, fd147, 0d3FD3C6EF372FE950, fd164;
mul.f64 fd166, fd156, 0d3FE2CF2304755A5E;
mul.f64 fd167, fd158, 0d3FEE6F0E134454FF;
sub.f64 fd168, fd167, fd166;
sub.f64 fd169, fd165, fd168;
add.f64 fd170, fd168, fd165;
fma.rn.f64 fd171, fd149, 0d3FD3C6EF372FE950, %56;
mul.f64 fd172, fd151, 0d3FE9E3779B97F4A8;
sub.f64 fd173, fd171, fd172;
sub.f64 fd174, %68, %108;
mul.f64 fd175, fd174, 0d3FEE6F0E134454FF;
sub.f64 fd176, %81, %94;
mul.f64 fd177, fd176, 0dBFE2CF2304755A5E;
sub.f64 fd178, fd177, fd175;
add.f64 fd179, fd178, fd173;
sub.f64 fd180, fd173, fd178;
mul.f64 fd181, fd149, 0d3FE9E3779B97F4A8;
sub.f64 fd182, %56, fd181;
fma.rn.f64 fd183, fd151, 0d3FD3C6EF372FE950, fd182;
mul.f64 fd184, fd174, 0d3FE2CF2304755A5E;
mul.f64 fd185, fd176, 0d3FEE6F0E134454FF;
sub.f64 fd186, fd185, fd184;
add.f64 fd187, fd186, fd183;
sub.f64 fd188, fd183, fd186;
add.f64 fd189, %70, %110;
add.f64 fd190, %57, fd189;
add.f64 fd191, %84, %97;
add.f64 fd192, fd191, fd190;
add.f64 fd193, %72, %112;
add.f64 fd194, %59, fd193;
add.f64 fd195, %85, %99;
add.f64 fd196, fd195, fd194;
fma.rn.f64 fd197, fd189, 0d3FD3C6EF372FE950, %57;
mul.f64 fd198, fd191, 0d3FE9E3779B97F4A8;
sub.f64 fd199, fd197, fd198;
sub.f64 fd200, %72, %112;
mul.f64 fd201, fd200, 0d3FEE6F0E134454FF;
sub.f64 fd202, %85, %99;
mul.f64 fd203, fd202, 0dBFE2CF2304755A5E;
sub.f64 fd204, fd203, fd201;
sub.f64 fd205, fd199, fd204;
add.f64 fd206, fd204, fd199;
mul.f64 fd207, fd189, 0d3FE9E3779B97F4A8;
sub.f64 fd208, %57, fd207;
fma.rn.f64 fd209, fd191, 0d3FD3C6EF372FE950, fd208;
mul.f64 fd210, fd200, 0d3FE2CF2304755A5E;
mul.f64 fd211, fd202, 0d3FEE6F0E134454FF;
sub.f64 fd212, fd211, fd210;
sub.f64 fd213, fd209, fd212;
add.f64 fd214, fd212, fd209;
fma.rn.f64 fd215, fd193, 0d3FD3C6EF372FE950, %59;
mul.f64 fd216, fd195, 0d3FE9E3779B97F4A8;
sub.f64 fd217, fd215, fd216;
sub.f64 fd218, %70, %110;
mul.f64 fd219, fd218, 0d3FEE6F0E134454FF;
sub.f64 fd220, %84, %97;
mul.f64 fd221, fd220, 0dBFE2CF2304755A5E;
sub.f64 fd222, fd221, fd219;
add.f64 fd223, fd222, fd217;
sub.f64 fd224, fd217, fd222;
mul.f64 fd225, fd193, 0d3FE9E3779B97F4A8;
sub.f64 fd226, %59, fd225;
fma.rn.f64 fd227, fd195, 0d3FD3C6EF372FE950, fd226;
mul.f64 fd228, fd218, 0d3FE2CF2304755A5E;
mul.f64 fd229, fd220, 0d3FEE6F0E134454FF;
sub.f64 fd230, fd229, fd228;
add.f64 fd231, fd230, fd227;
sub.f64 fd232, fd227, fd230;
add.f64 fd233, %73, %113;
add.f64 fd234, %60, fd233;
add.f64 fd235, %86, %100;
add.f64 fd236, fd235, fd234;
add.f64 fd237, %75, %115;
add.f64 fd238, %61, fd237;
add.f64 fd239, %88, %101;
add.f64 fd240, fd239, fd238;
fma.rn.f64 fd241, fd233, 0d3FD3C6EF372FE950, %60;
mul.f64 fd242, fd235, 0d3FE9E3779B97F4A8;
sub.f64 fd243, fd241, fd242;
sub.f64 fd244, %75, %115;
mul.f64 fd245, fd244, 0d3FEE6F0E134454FF;
sub.f64 fd246, %88, %101;
mul.f64 fd247, fd246, 0dBFE2CF2304755A5E;
sub.f64 fd248, fd247, fd245;
sub.f64 fd249, fd243, fd248;
add.f64 fd250, fd248, fd243;
mul.f64 fd251, fd233, 0d3FE9E3779B97F4A8;
sub.f64 fd252, %60, fd251;
fma.rn.f64 fd253, fd235, 0d3FD3C6EF372FE950, fd252;
mul.f64 fd254, fd244, 0d3FE2CF2304755A5E;
mul.f64 fd255, fd246, 0d3FEE6F0E134454FF;
sub.f64 fd256, fd255, fd254;
sub.f64 fd257, fd253, fd256;
add.f64 fd258, fd256, fd253;
fma.rn.f64 fd259, fd237, 0d3FD3C6EF372FE950, %61;
mul.f64 fd260, fd239, 0d3FE9E3779B97F4A8;
sub.f64 fd261, fd259, fd260;
sub.f64 fd262, %73, %113;
mul.f64 fd263, fd262, 0d3FEE6F0E134454FF;
sub.f64 fd264, %86, %100;
mul.f64 fd265, fd264, 0dBFE2CF2304755A5E;
sub.f64 fd266, fd265, fd263;
add.f64 fd267, fd266, fd261;
sub.f64 fd268, fd261, fd266;
mul.f64 fd269, fd237, 0d3FE9E3779B97F4A8;
sub.f64 fd270, %61, fd269;
fma.rn.f64 fd271, fd239, 0d3FD3C6EF372FE950, fd270;
mul.f64 fd272, fd262, 0d3FE2CF2304755A5E;
mul.f64 fd273, fd264, 0d3FEE6F0E134454FF;
sub.f64 fd274, fd273, fd272;
add.f64 fd275, fd274, fd271;
sub.f64 fd276, fd271, fd274;
add.f64 fd277, %76, %116;
add.f64 fd278, %62, fd277;
add.f64 fd279, %89, %102;
add.f64 fd280, fd279, fd278;
add.f64 fd281, %77, %117;
add.f64 fd282, %64, fd281;
add.f64 fd283, %91, %104;
add.f64 fd284, fd283, fd282;
fma.rn.f64 fd285, fd277, 0d3FD3C6EF372FE950, %62;
mul.f64 fd286, fd279, 0d3FE9E3779B97F4A8;
sub.f64 fd287, fd285, fd286;
sub.f64 fd288, %77, %117;
mul.f64 fd289, fd288, 0d3FEE6F0E134454FF;
sub.f64 fd290, %91, %104;
mul.f64 fd291, fd290, 0dBFE2CF2304755A5E;
sub.f64 fd292, fd291, fd289;
sub.f64 fd293, fd287, fd292;
add.f64 fd294, fd292, fd287;
mul.f64 fd295, fd277, 0d3FE9E3779B97F4A8;
sub.f64 fd296, %62, fd295;
fma.rn.f64 fd297, fd279, 0d3FD3C6EF372FE950, fd296;
mul.f64 fd298, fd288, 0d3FE2CF2304755A5E;
mul.f64 fd299, fd290, 0d3FEE6F0E134454FF;
sub.f64 fd300, fd299, fd298;
sub.f64 fd301, fd297, fd300;
add.f64 fd302, fd300, fd297;
fma.rn.f64 fd303, fd281, 0d3FD3C6EF372FE950, %64;
mul.f64 fd304, fd283, 0d3FE9E3779B97F4A8;
sub.f64 fd305, fd303, fd304;
sub.f64 fd306, %76, %116;
mul.f64 fd307, fd306, 0d3FEE6F0E134454FF;
sub.f64 fd308, %89, %102;
mul.f64 fd309, fd308, 0dBFE2CF2304755A5E;
sub.f64 fd310, fd309, fd307;
add.f64 fd311, fd310, fd305;
sub.f64 fd312, fd305, fd310;
mul.f64 fd313, fd281, 0d3FE9E3779B97F4A8;
sub.f64 fd314, %64, fd313;
fma.rn.f64 fd315, fd283, 0d3FD3C6EF372FE950, fd314;
mul.f64 fd316, fd306, 0d3FE2CF2304755A5E;
mul.f64 fd317, fd308, 0d3FEE6F0E134454FF;
sub.f64 fd318, fd317, fd316;
add.f64 fd319, fd318, fd315;
sub.f64 fd320, fd315, fd318;
mov.u32 r4, %tid.x;
mul.f64 fd321, fd161, 0d3FEEFEA21D101EE0;
mul.f64 fd322, fd179, 0dBFCFD511FA1C0796;
sub.f64 fd323, fd321, fd322;
mul.f64 fd324, fd179, 0d3FEEFEA21D101EE0;
fma.rn.f64 fd325, fd161, 0dBFCFD511FA1C0796, fd324;
mul.f64 fd326, fd205, 0d3FEC0AB44E81C059;
mul.f64 fd327, fd223, 0dBFDED50D5CBFA951;
sub.f64 fd328, fd326, fd327;
mul.f64 fd329, fd223, 0d3FEC0AB44E81C059;
fma.rn.f64 fd330, fd205, 0dBFDED50D5CBFA951, fd329;
mul.f64 fd331, fd249, 0d3FE753B603D2B816;
mul.f64 fd332, fd267, 0dBFE5E7CF55112014;
sub.f64 fd333, fd331, fd332;
mul.f64 fd334, fd267, 0d3FE753B603D2B816;
fma.rn.f64 fd335, fd249, 0dBFE5E7CF55112014, fd334;
mul.f64 fd336, fd293, 0d3FE1257E3C182B51;
mul.f64 fd337, fd311, 0dBFEB04BBFF642E86;
sub.f64 fd338, fd336, fd337;
mul.f64 fd339, fd311, 0d3FE1257E3C182B51;
fma.rn.f64 fd340, fd293, 0dBFEB04BBFF642E86, fd339;
mul.f64 fd341, fd169, 0d3FEC0AB44E81C059;
mul.f64 fd342, fd187, 0dBFDED50D5CBFA951;
sub.f64 fd343, fd341, fd342;
mul.f64 fd344, fd187, 0d3FEC0AB44E81C059;
fma.rn.f64 fd345, fd169, 0dBFDED50D5CBFA951, fd344;
mul.f64 fd346, fd213, 0d3FE1257E3C182B51;
mul.f64 fd347, fd231, 0dBFEB04BBFF642E86;
sub.f64 fd348, fd346, fd347;
mul.f64 fd349, fd231, 0d3FE1257E3C182B51;
fma.rn.f64 fd350, fd213, 0dBFEB04BBFF642E86, fd349;
mul.f64 fd351, fd257, 0d3FB0130A1BE09379;
mul.f64 fd352, fd275, 0dBFEFEFD5BFE443FE;
sub.f64 fd353, fd351, fd352;
mul.f64 fd354, fd275, 0d3FB0130A1BE09379;
fma.rn.f64 fd355, fd257, 0dBFEFEFD5BFE443FE, fd354;
mul.f64 fd356, fd301, 0dBFDB3FF7C925819C;
mul.f64 fd357, fd319, 0dBFECF457DCDC158C;
sub.f64 fd358, fd356, fd357;
mul.f64 fd359, fd319, 0dBFDB3FF7C925819C;
fma.rn.f64 fd360, fd301, 0dBFECF457DCDC158C, fd359;
mul.f64 fd361, fd170, 0d3FE753B603D2B816;
mul.f64 fd362, fd188, 0dBFE5E7CF55112014;
sub.f64 fd363, fd361, fd362;
mul.f64 fd364, fd188, 0d3FE753B603D2B816;
fma.rn.f64 fd365, fd170, 0dBFE5E7CF55112014, fd364;
mul.f64 fd366, fd214, 0d3FB0130A1BE09379;
mul.f64 fd367, fd232, 0dBFEFEFD5BFE443FE;
sub.f64 fd368, fd366, fd367;
mul.f64 fd369, fd232, 0d3FB0130A1BE09379;
fma.rn.f64 fd370, fd214, 0dBFEFEFD5BFE443FE, fd369;
mul.f64 fd371, fd258, 0dBFE465C6FEB501BC;
mul.f64 fd372, fd276, 0dBFE8A80B635B6BEA;
sub.f64 fd373, fd371, fd372;
mul.f64 fd374, fd276, 0dBFE465C6FEB501BC;
fma.rn.f64 fd375, fd258, 0dBFE8A80B635B6BEA, fd374;
mul.f64 fd376, fd302, 0dBFEFBF675480D903;
mul.f64 fd377, fd320, 0dBFC00AEB5DA15BE0;
sub.f64 fd378, fd376, fd377;
mul.f64 fd379, fd320, 0dBFEFBF675480D903;
fma.rn.f64 fd380, fd302, 0dBFC00AEB5DA15BE0, fd379;
mul.f64 fd381, fd162, 0d3FE1257E3C182B51;
mul.f64 fd382, fd180, 0dBFEB04BBFF642E86;
sub.f64 fd383, fd381, fd382;
mul.f64 fd384, fd180, 0d3FE1257E3C182B51;
fma.rn.f64 fd385, fd162, 0dBFEB04BBFF642E86, fd384;
mul.f64 fd386, fd206, 0dBFDB3FF7C925819C;
mul.f64 fd387, fd224, 0dBFECF457DCDC158C;
sub.f64 fd388, fd386, fd387;
mul.f64 fd389, fd224, 0dBFDB3FF7C925819C;
fma.rn.f64 fd390, fd206, 0dBFECF457DCDC158C, fd389;
mul.f64 fd391, fd250, 0dBFEFBF675480D903;
mul.f64 fd392, fd268, 0dBFC00AEB5DA15BE0;
sub.f64 fd393, fd391, fd392;
mul.f64 fd394, fd268, 0dBFEFBF675480D903;
fma.rn.f64 fd395, fd250, 0dBFC00AEB5DA15BE0, fd394;
mul.f64 fd396, fd294, 0dBFE465C6FEB501BC;
mul.f64 fd397, fd312, 0d3FE8A80B635B6BEA;
sub.f64 fd398, fd396, fd397;
mul.f64 fd399, fd312, 0dBFE465C6FEB501BC;
fma.rn.f64 fd400, fd294, 0d3FE8A80B635B6BEA, fd399;
add.f64 fd401, fd148, fd280;
add.f64 fd402, fd104, fd401;
add.f64 fd403, fd192, fd236;
add.f64 fd404, fd403, fd402;
add.f64 fd405, fd152, fd284;
add.f64 fd406, fd108, fd405;
add.f64 fd407, fd196, fd240;
add.f64 fd408, fd407, fd406;
fma.rn.f64 fd409, fd401, 0d3FD3C6EF372FE950, fd104;
mul.f64 fd410, fd403, 0d3FE9E3779B97F4A8;
sub.f64 fd411, fd409, fd410;
sub.f64 fd412, fd152, fd284;
mul.f64 fd413, fd412, 0d3FEE6F0E134454FF;
sub.f64 fd414, fd196, fd240;
mul.f64 fd415, fd414, 0dBFE2CF2304755A5E;
sub.f64 fd416, fd415, fd413;
sub.f64 fd417, fd411, fd416;
add.f64 fd418, fd416, fd411;
mul.f64 fd419, fd401, 0d3FE9E3779B97F4A8;
sub.f64 fd420, fd104, fd419;
fma.rn.f64 fd421, fd403, 0d3FD3C6EF372FE950, fd420;
mul.f64 fd422, fd412, 0d3FE2CF2304755A5E;
mul.f64 fd423, fd414, 0d3FEE6F0E134454FF;
sub.f64 fd424, fd423, fd422;
sub.f64 fd425, fd421, fd424;
add.f64 fd426, fd424, fd421;
fma.rn.f64 fd427, fd405, 0d3FD3C6EF372FE950, fd108;
mul.f64 fd428, fd407, 0d3FE9E3779B97F4A8;
sub.f64 fd429, fd427, fd428;
sub.f64 fd430, fd148, fd280;
mul.f64 fd431, fd430, 0d3FEE6F0E134454FF;
sub.f64 fd432, fd192, fd236;
mul.f64 fd433, fd432, 0dBFE2CF2304755A5E;
sub.f64 fd434, fd433, fd431;
add.f64 fd435, fd434, fd429;
sub.f64 fd436, fd429, fd434;
mul.f64 fd437, fd405, 0d3FE9E3779B97F4A8;
sub.f64 fd438, fd108, fd437;
fma.rn.f64 fd439, fd407, 0d3FD3C6EF372FE950, fd438;
mul.f64 fd440, fd430, 0d3FE2CF2304755A5E;
mul.f64 fd441, fd432, 0d3FEE6F0E134454FF;
sub.f64 fd442, fd441, fd440;
add.f64 fd443, fd442, fd439;
sub.f64 fd444, fd439, fd442;
add.f64 fd445, fd323, fd338;
add.f64 fd446, fd117, fd445;
add.f64 fd447, fd328, fd333;
add.f64 fd448, fd447, fd446;
add.f64 fd449, fd325, fd340;
add.f64 fd450, fd135, fd449;
add.f64 fd451, fd330, fd335;
add.f64 fd452, fd451, fd450;
fma.rn.f64 fd453, fd445, 0d3FD3C6EF372FE950, fd117;
mul.f64 fd454, fd447, 0d3FE9E3779B97F4A8;
sub.f64 fd455, fd453, fd454;
sub.f64 fd456, fd325, fd340;
mul.f64 fd457, fd456, 0d3FEE6F0E134454FF;
sub.f64 fd458, fd330, fd335;
mul.f64 fd459, fd458, 0dBFE2CF2304755A5E;
sub.f64 fd460, fd459, fd457;
sub.f64 fd461, fd455, fd460;
add.f64 fd462, fd460, fd455;
mul.f64 fd463, fd445, 0d3FE9E3779B97F4A8;
sub.f64 fd464, fd117, fd463;
fma.rn.f64 fd465, fd447, 0d3FD3C6EF372FE950, fd464;
mul.f64 fd466, fd456, 0d3FE2CF2304755A5E;
mul.f64 fd467, fd458, 0d3FEE6F0E134454FF;
sub.f64 fd468, fd467, fd466;
sub.f64 fd469, fd465, fd468;
add.f64 fd470, fd468, fd465;
fma.rn.f64 fd471, fd449, 0d3FD3C6EF372FE950, fd135;
mul.f64 fd472, fd451, 0d3FE9E3779B97F4A8;
sub.f64 fd473, fd471, fd472;
sub.f64 fd474, fd323, fd338;
mul.f64 fd475, fd474, 0d3FEE6F0E134454FF;
sub.f64 fd476, fd328, fd333;
mul.f64 fd477, fd476, 0dBFE2CF2304755A5E;
sub.f64 fd478, fd477, fd475;
add.f64 fd479, fd478, fd473;
sub.f64 fd480, fd473, fd478;
mul.f64 fd481, fd449, 0d3FE9E3779B97F4A8;
sub.f64 fd482, fd135, fd481;
fma.rn.f64 fd483, fd451, 0d3FD3C6EF372FE950, fd482;
mul.f64 fd484, fd474, 0d3FE2CF2304755A5E;
mul.f64 fd485, fd476, 0d3FEE6F0E134454FF;
sub.f64 fd486, fd485, fd484;
add.f64 fd487, fd486, fd483;
sub.f64 fd488, fd483, fd486;
add.f64 fd489, fd343, fd358;
add.f64 fd490, fd125, fd489;
add.f64 fd491, fd348, fd353;
add.f64 fd492, fd491, fd490;
add.f64 fd493, fd345, fd360;
add.f64 fd494, fd143, fd493;
add.f64 fd495, fd350, fd355;
add.f64 fd496, fd495, fd494;
fma.rn.f64 fd497, fd489, 0d3FD3C6EF372FE950, fd125;
mul.f64 fd498, fd491, 0d3FE9E3779B97F4A8;
sub.f64 fd499, fd497, fd498;
sub.f64 fd500, fd345, fd360;
mul.f64 fd501, fd500, 0d3FEE6F0E134454FF;
sub.f64 fd502, fd350, fd355;
mul.f64 fd503, fd502, 0dBFE2CF2304755A5E;
sub.f64 fd504, fd503, fd501;
sub.f64 fd505, fd499, fd504;
add.f64 fd506, fd504, fd499;
mul.f64 fd507, fd489, 0d3FE9E3779B97F4A8;
sub.f64 fd508, fd125, fd507;
fma.rn.f64 fd509, fd491, 0d3FD3C6EF372FE950, fd508;
mul.f64 fd510, fd500, 0d3FE2CF2304755A5E;
mul.f64 fd511, fd502, 0d3FEE6F0E134454FF;
sub.f64 fd512, fd511, fd510;
sub.f64 fd513, fd509, fd512;
add.f64 fd514, fd512, fd509;
fma.rn.f64 fd515, fd493, 0d3FD3C6EF372FE950, fd143;
mul.f64 fd516, fd495, 0d3FE9E3779B97F4A8;
sub.f64 fd517, fd515, fd516;
sub.f64 fd518, fd343, fd358;
mul.f64 fd519, fd518, 0d3FEE6F0E134454FF;
sub.f64 fd520, fd348, fd353;
mul.f64 fd521, fd520, 0dBFE2CF2304755A5E;
sub.f64 fd522, fd521, fd519;
add.f64 fd523, fd522, fd517;
sub.f64 fd524, fd517, fd522;
mul.f64 fd525, fd493, 0d3FE9E3779B97F4A8;
sub.f64 fd526, fd143, fd525;
fma.rn.f64 fd527, fd495, 0d3FD3C6EF372FE950, fd526;
mul.f64 fd528, fd518, 0d3FE2CF2304755A5E;
mul.f64 fd529, fd520, 0d3FEE6F0E134454FF;
sub.f64 fd530, fd529, fd528;
add.f64 fd531, fd530, fd527;
sub.f64 fd532, fd527, fd530;
add.f64 fd533, fd363, fd378;
add.f64 fd534, fd126, fd533;
add.f64 fd535, fd368, fd373;
add.f64 fd536, fd535, fd534;
add.f64 fd537, fd365, fd380;
add.f64 fd538, fd144, fd537;
add.f64 fd539, fd370, fd375;
add.f64 fd540, fd539, fd538;
fma.rn.f64 fd541, fd533, 0d3FD3C6EF372FE950, fd126;
mul.f64 fd542, fd535, 0d3FE9E3779B97F4A8;
sub.f64 fd543, fd541, fd542;
sub.f64 fd544, fd365, fd380;
mul.f64 fd545, fd544, 0d3FEE6F0E134454FF;
sub.f64 fd546, fd370, fd375;
mul.f64 fd547, fd546, 0dBFE2CF2304755A5E;
sub.f64 fd548, fd547, fd545;
sub.f64 fd549, fd543, fd548;
add.f64 fd550, fd548, fd543;
mul.f64 fd551, fd533, 0d3FE9E3779B97F4A8;
sub.f64 fd552, fd126, fd551;
fma.rn.f64 fd553, fd535, 0d3FD3C6EF372FE950, fd552;
mul.f64 fd554, fd544, 0d3FE2CF2304755A5E;
mul.f64 fd555, fd546, 0d3FEE6F0E134454FF;
sub.f64 fd556, fd555, fd554;
sub.f64 fd557, fd553, fd556;
add.f64 fd558, fd556, fd553;
fma.rn.f64 fd559, fd537, 0d3FD3C6EF372FE950, fd144;
mul.f64 fd560, fd539, 0d3FE9E3779B97F4A8;
sub.f64 fd561, fd559, fd560;
sub.f64 fd562, fd363, fd378;
mul.f64 fd563, fd562, 0d3FEE6F0E134454FF;
sub.f64 fd564, fd368, fd373;
mul.f64 fd565, fd564, 0dBFE2CF2304755A5E;
sub.f64 fd566, fd565, fd563;
add.f64 fd567, fd566, fd561;
sub.f64 fd568, fd561, fd566;
mul.f64 fd569, fd537, 0d3FE9E3779B97F4A8;
sub.f64 fd570, fd144, fd569;
fma.rn.f64 fd571, fd539, 0d3FD3C6EF372FE950, fd570;
mul.f64 fd572, fd562, 0d3FE2CF2304755A5E;
mul.f64 fd573, fd564, 0d3FEE6F0E134454FF;
sub.f64 fd574, fd573, fd572;
add.f64 fd575, fd574, fd571;
sub.f64 fd576, fd571, fd574;
add.f64 fd577, fd383, fd398;
add.f64 fd578, fd118, fd577;
add.f64 fd579, fd388, fd393;
add.f64 fd580, fd579, fd578;
add.f64 fd581, fd385, fd400;
add.f64 fd582, fd136, fd581;
add.f64 fd583, fd390, fd395;
add.f64 fd584, fd583, fd582;
fma.rn.f64 fd585, fd577, 0d3FD3C6EF372FE950, fd118;
mul.f64 fd586, fd579, 0d3FE9E3779B97F4A8;
sub.f64 fd587, fd585, fd586;
sub.f64 fd588, fd385, fd400;
mul.f64 fd589, fd588, 0d3FEE6F0E134454FF;
sub.f64 fd590, fd390, fd395;
mul.f64 fd591, fd590, 0dBFE2CF2304755A5E;
sub.f64 fd592, fd591, fd589;
sub.f64 fd593, fd587, fd592;
add.f64 fd594, fd592, fd587;
mul.f64 fd595, fd577, 0d3FE9E3779B97F4A8;
sub.f64 fd596, fd118, fd595;
fma.rn.f64 fd597, fd579, 0d3FD3C6EF372FE950, fd596;
mul.f64 fd598, fd588, 0d3FE2CF2304755A5E;
mul.f64 fd599, fd590, 0d3FEE6F0E134454FF;
sub.f64 fd600, fd599, fd598;
sub.f64 fd601, fd597, fd600;
add.f64 fd602, fd600, fd597;
fma.rn.f64 fd603, fd581, 0d3FD3C6EF372FE950, fd136;
mul.f64 fd604, fd583, 0d3FE9E3779B97F4A8;
sub.f64 fd605, fd603, fd604;
sub.f64 fd606, fd383, fd398;
mul.f64 fd607, fd606, 0d3FEE6F0E134454FF;
sub.f64 fd608, fd388, fd393;
mul.f64 fd609, fd608, 0dBFE2CF2304755A5E;
sub.f64 fd610, fd609, fd607;
add.f64 fd611, fd610, fd605;
sub.f64 fd612, fd605, fd610;
mul.f64 fd613, fd581, 0d3FE9E3779B97F4A8;
sub.f64 fd614, fd136, fd613;
fma.rn.f64 fd615, fd583, 0d3FD3C6EF372FE950, fd614;
mul.f64 fd616, fd606, 0d3FE2CF2304755A5E;
mul.f64 fd617, fd608, 0d3FEE6F0E134454FF;
sub.f64 fd618, fd617, fd616;
add.f64 fd619, fd618, fd615;
sub.f64 fd620, fd615, fd618;
mul.wide.u32 rd2, r4, 1374389535;
shr.u64 rd3, rd2, 35;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 25;
sub.s32 r7, r4, r6;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %51;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd621, fd622}, [rd6];
mul.f64 fd625, fd621, fd448;
mul.f64 fd626, fd622, fd452;
sub.f64 fd627, fd625, fd626;
mul.f64 fd628, fd621, fd452;
fma.rn.f64 fd629, fd622, fd448, fd628;
mul.f64 fd630, fd621, fd621;
mul.f64 fd631, fd622, fd622;
sub.f64 fd632, fd630, fd631;
mul.f64 fd633, fd622, fd621;
fma.rn.f64 fd634, fd622, fd621, fd633;
mul.f64 fd635, fd632, fd492;
mul.f64 fd636, fd634, fd496;
sub.f64 fd637, fd635, fd636;
mul.f64 fd638, fd632, fd496;
fma.rn.f64 fd639, fd634, fd492, fd638;
mul.f64 fd640, fd621, fd632;
mul.f64 fd641, fd622, fd634;
sub.f64 fd642, fd640, fd641;
mul.f64 fd643, fd621, fd634;
fma.rn.f64 fd644, fd622, fd632, fd643;
mul.f64 fd645, fd642, fd536;
mul.f64 fd646, fd644, fd540;
sub.f64 fd647, fd645, fd646;
mul.f64 fd648, fd642, fd540;
fma.rn.f64 fd649, fd644, fd536, fd648;
mul.f64 fd650, fd621, fd642;
mul.f64 fd651, fd622, fd644;
sub.f64 fd652, fd650, fd651;
mul.f64 fd653, fd621, fd644;
fma.rn.f64 fd654, fd622, fd642, fd653;
mul.f64 fd655, fd652, fd580;
mul.f64 fd656, fd654, fd584;
sub.f64 fd657, fd655, fd656;
mul.f64 fd658, fd652, fd584;
fma.rn.f64 fd659, fd654, fd580, fd658;
mul.f64 fd660, fd621, fd652;
mul.f64 fd661, fd622, fd654;
sub.f64 fd662, fd660, fd661;
mul.f64 fd663, fd621, fd654;
fma.rn.f64 fd664, fd622, fd652, fd663;
mul.f64 fd665, fd662, fd417;
mul.f64 fd666, fd664, fd435;
sub.f64 fd667, fd665, fd666;
mul.f64 fd668, fd662, fd435;
fma.rn.f64 fd669, fd664, fd417, fd668;
mul.f64 fd670, fd621, fd662;
mul.f64 fd671, fd622, fd664;
sub.f64 fd672, fd670, fd671;
mul.f64 fd673, fd621, fd664;
fma.rn.f64 fd674, fd622, fd662, fd673;
mul.f64 fd675, fd672, fd461;
mul.f64 fd676, fd674, fd479;
sub.f64 fd677, fd675, fd676;
mul.f64 fd678, fd672, fd479;
fma.rn.f64 fd679, fd674, fd461, fd678;
mul.f64 fd680, fd621, fd672;
mul.f64 fd681, fd622, fd674;
sub.f64 fd682, fd680, fd681;
mul.f64 fd683, fd621, fd674;
fma.rn.f64 fd684, fd622, fd672, fd683;
mul.f64 fd685, fd682, fd505;
mul.f64 fd686, fd684, fd523;
sub.f64 fd687, fd685, fd686;
mul.f64 fd688, fd682, fd523;
fma.rn.f64 fd689, fd684, fd505, fd688;
mul.f64 fd690, fd621, fd682;
mul.f64 fd691, fd622, fd684;
sub.f64 fd692, fd690, fd691;
mul.f64 fd693, fd621, fd684;
fma.rn.f64 fd694, fd622, fd682, fd693;
mul.f64 fd695, fd692, fd549;
mul.f64 fd696, fd694, fd567;
sub.f64 fd697, fd695, fd696;
mul.f64 fd698, fd692, fd567;
fma.rn.f64 fd699, fd694, fd549, fd698;
mul.f64 fd700, fd621, fd692;
mul.f64 fd701, fd622, fd694;
sub.f64 fd702, fd700, fd701;
mul.f64 fd703, fd621, fd694;
fma.rn.f64 fd704, fd622, fd692, fd703;
mul.f64 fd705, fd702, fd593;
mul.f64 fd706, fd704, fd611;
sub.f64 fd707, fd705, fd706;
mul.f64 fd708, fd702, fd611;
fma.rn.f64 fd709, fd704, fd593, fd708;
mul.f64 fd710, fd621, fd702;
mul.f64 fd711, fd622, fd704;
sub.f64 fd712, fd710, fd711;
mul.f64 fd713, fd621, fd704;
fma.rn.f64 fd714, fd622, fd702, fd713;
mul.f64 fd715, fd712, fd425;
mul.f64 fd716, fd714, fd443;
sub.f64 fd717, fd715, fd716;
mul.f64 fd718, fd712, fd443;
fma.rn.f64 fd719, fd714, fd425, fd718;
mul.f64 fd720, fd621, fd712;
mul.f64 fd721, fd622, fd714;
sub.f64 fd722, fd720, fd721;
mul.f64 fd723, fd621, fd714;
fma.rn.f64 fd724, fd622, fd712, fd723;
mul.f64 fd725, fd722, fd469;
mul.f64 fd726, fd724, fd487;
sub.f64 fd727, fd725, fd726;
mul.f64 fd728, fd722, fd487;
fma.rn.f64 fd729, fd724, fd469, fd728;
mul.f64 fd730, fd621, fd722;
mul.f64 fd731, fd622, fd724;
sub.f64 fd732, fd730, fd731;
mul.f64 fd733, fd621, fd724;
fma.rn.f64 fd734, fd622, fd722, fd733;
mul.f64 fd735, fd732, fd513;
mul.f64 fd736, fd734, fd531;
sub.f64 fd737, fd735, fd736;
mul.f64 fd738, fd732, fd531;
fma.rn.f64 fd739, fd734, fd513, fd738;
ld.global.v2.f64 {fd740, fd741}, [rd6+400];
mul.f64 fd744, fd740, fd557;
mul.f64 fd745, fd741, fd575;
sub.f64 fd746, fd744, fd745;
mul.f64 fd747, fd740, fd575;
fma.rn.f64 fd748, fd741, fd557, fd747;
mul.f64 fd749, fd621, fd740;
mul.f64 fd750, fd622, fd741;
sub.f64 fd751, fd749, fd750;
mul.f64 fd752, fd621, fd741;
fma.rn.f64 fd753, fd622, fd740, fd752;
mul.f64 fd754, fd751, fd601;
mul.f64 fd755, fd753, fd619;
sub.f64 fd756, fd754, fd755;
mul.f64 fd757, fd751, fd619;
fma.rn.f64 fd758, fd753, fd601, fd757;
mul.f64 fd759, fd621, fd751;
mul.f64 fd760, fd622, fd753;
sub.f64 fd761, fd759, fd760;
mul.f64 fd762, fd621, fd753;
fma.rn.f64 fd763, fd622, fd751, fd762;
mul.f64 fd764, fd761, fd426;
mul.f64 fd765, fd763, fd444;
sub.f64 fd766, fd764, fd765;
mul.f64 fd767, fd761, fd444;
fma.rn.f64 fd768, fd763, fd426, fd767;
mul.f64 fd769, fd621, fd761;
mul.f64 fd770, fd622, fd763;
sub.f64 fd771, fd769, fd770;
mul.f64 fd772, fd621, fd763;
fma.rn.f64 fd773, fd622, fd761, fd772;
mul.f64 fd774, fd771, fd470;
mul.f64 fd775, fd773, fd488;
sub.f64 fd776, fd774, fd775;
mul.f64 fd777, fd771, fd488;
fma.rn.f64 fd778, fd773, fd470, fd777;
mul.f64 fd779, fd621, fd771;
mul.f64 fd780, fd622, fd773;
sub.f64 fd781, fd779, fd780;
mul.f64 fd782, fd621, fd773;
fma.rn.f64 fd783, fd622, fd771, fd782;
mul.f64 fd784, fd781, fd514;
mul.f64 fd785, fd783, fd532;
sub.f64 fd786, fd784, fd785;
mul.f64 fd787, fd781, fd532;
fma.rn.f64 fd788, fd783, fd514, fd787;
mul.f64 fd789, fd621, fd781;
mul.f64 fd790, fd622, fd783;
sub.f64 fd791, fd789, fd790;
mul.f64 fd792, fd621, fd783;
fma.rn.f64 fd793, fd622, fd781, fd792;
mul.f64 fd794, fd791, fd558;
mul.f64 fd795, fd793, fd576;
sub.f64 fd796, fd794, fd795;
mul.f64 fd797, fd791, fd576;
fma.rn.f64 fd798, fd793, fd558, fd797;
mul.f64 fd799, fd621, fd791;
mul.f64 fd800, fd622, fd793;
sub.f64 fd801, fd799, fd800;
mul.f64 fd802, fd621, fd793;
fma.rn.f64 fd803, fd622, fd791, fd802;
mul.f64 fd804, fd801, fd602;
mul.f64 fd805, fd803, fd620;
sub.f64 fd806, fd804, fd805;
mul.f64 fd807, fd801, fd620;
fma.rn.f64 fd808, fd803, fd602, fd807;
mul.f64 fd809, fd621, fd801;
mul.f64 fd810, fd622, fd803;
sub.f64 fd811, fd809, fd810;
mul.f64 fd812, fd621, fd803;
fma.rn.f64 fd813, fd622, fd801, fd812;
mul.f64 fd814, fd811, fd418;
mul.f64 fd815, fd813, fd436;
sub.f64 fd816, fd814, fd815;
mul.f64 fd817, fd811, fd436;
fma.rn.f64 fd818, fd813, fd418, fd817;
mul.f64 fd819, fd621, fd811;
mul.f64 fd820, fd622, fd813;
sub.f64 fd821, fd819, fd820;
mul.f64 fd822, fd621, fd813;
fma.rn.f64 fd823, fd622, fd811, fd822;
mul.f64 fd824, fd821, fd462;
mul.f64 fd825, fd823, fd480;
sub.f64 fd826, fd824, fd825;
mul.f64 fd827, fd821, fd480;
fma.rn.f64 fd828, fd823, fd462, fd827;
mul.f64 fd829, fd621, fd821;
mul.f64 fd830, fd622, fd823;
sub.f64 fd831, fd829, fd830;
mul.f64 fd832, fd621, fd823;
fma.rn.f64 fd833, fd622, fd821, fd832;
mul.f64 fd834, fd831, fd506;
mul.f64 fd835, fd833, fd524;
sub.f64 fd836, fd834, fd835;
mul.f64 fd837, fd831, fd524;
fma.rn.f64 fd838, fd833, fd506, fd837;
mul.f64 fd839, fd621, fd831;
mul.f64 fd840, fd622, fd833;
sub.f64 fd841, fd839, fd840;
mul.f64 fd842, fd621, fd833;
fma.rn.f64 fd843, fd622, fd831, fd842;
mul.f64 fd844, fd841, fd550;
mul.f64 fd845, fd843, fd568;
sub.f64 fd846, fd844, fd845;
mul.f64 fd847, fd841, fd568;
fma.rn.f64 fd848, fd843, fd550, fd847;
mul.f64 fd849, fd621, fd841;
mul.f64 fd850, fd622, fd843;
sub.f64 fd851, fd849, fd850;
mul.f64 fd852, fd621, fd843;
fma.rn.f64 fd853, fd622, fd841, fd852;
mul.f64 fd854, fd851, fd594;
mul.f64 fd855, fd853, fd612;
sub.f64 fd856, fd854, fd855;
mul.f64 fd857, fd851, fd612;
fma.rn.f64 fd858, fd853, fd594, fd857;
mad.lo.s32 r8, r5, 5000, r3;
barrier.sync 0;
mad.lo.s32 r9, r7, 200, r8;
st.shared.f64 [r9], fd404;
st.shared.f64 [r9+8], fd627;
st.shared.f64 [r9+16], fd637;
st.shared.f64 [r9+24], fd647;
st.shared.f64 [r9+32], fd657;
st.shared.f64 [r9+40], fd667;
st.shared.f64 [r9+48], fd677;
st.shared.f64 [r9+56], fd687;
st.shared.f64 [r9+64], fd697;
st.shared.f64 [r9+72], fd707;
st.shared.f64 [r9+80], fd717;
st.shared.f64 [r9+88], fd727;
st.shared.f64 [r9+96], fd737;
st.shared.f64 [r9+104], fd746;
st.shared.f64 [r9+112], fd756;
st.shared.f64 [r9+120], fd766;
st.shared.f64 [r9+128], fd776;
st.shared.f64 [r9+136], fd786;
st.shared.f64 [r9+144], fd796;
st.shared.f64 [r9+152], fd806;
st.shared.f64 [r9+160], fd816;
st.shared.f64 [r9+168], fd826;
st.shared.f64 [r9+176], fd836;
st.shared.f64 [r9+184], fd846;
st.shared.f64 [r9+192], fd856;
barrier.sync 0;
mad.lo.s32 r10, r7, -192, r9;
ld.shared.f64 fd859, [r10];
ld.shared.f64 fd860, [r10+200];
ld.shared.f64 fd861, [r10+400];
ld.shared.f64 fd862, [r10+600];
ld.shared.f64 fd863, [r10+800];
ld.shared.f64 fd864, [r10+1000];
ld.shared.f64 fd865, [r10+1200];
ld.shared.f64 fd866, [r10+1400];
ld.shared.f64 fd867, [r10+1600];
ld.shared.f64 fd868, [r10+1800];
ld.shared.f64 fd869, [r10+2000];
ld.shared.f64 fd870, [r10+2200];
ld.shared.f64 fd871, [r10+2400];
ld.shared.f64 fd872, [r10+2600];
ld.shared.f64 fd873, [r10+2800];
ld.shared.f64 fd874, [r10+3000];
ld.shared.f64 fd875, [r10+3200];
ld.shared.f64 fd876, [r10+3400];
ld.shared.f64 fd877, [r10+3600];
ld.shared.f64 fd878, [r10+3800];
ld.shared.f64 fd879, [r10+4000];
ld.shared.f64 fd880, [r10+4200];
ld.shared.f64 fd881, [r10+4400];
ld.shared.f64 fd882, [r10+4600];
ld.shared.f64 fd883, [r10+4800];
barrier.sync 0;
st.shared.f64 [r9], fd408;
st.shared.f64 [r9+8], fd629;
st.shared.f64 [r9+16], fd639;
st.shared.f64 [r9+24], fd649;
st.shared.f64 [r9+32], fd659;
st.shared.f64 [r9+40], fd669;
st.shared.f64 [r9+48], fd679;
st.shared.f64 [r9+56], fd689;
st.shared.f64 [r9+64], fd699;
st.shared.f64 [r9+72], fd709;
st.shared.f64 [r9+80], fd719;
st.shared.f64 [r9+88], fd729;
st.shared.f64 [r9+96], fd739;
st.shared.f64 [r9+104], fd748;
st.shared.f64 [r9+112], fd758;
st.shared.f64 [r9+120], fd768;
st.shared.f64 [r9+128], fd778;
st.shared.f64 [r9+136], fd788;
st.shared.f64 [r9+144], fd798;
st.shared.f64 [r9+152], fd808;
st.shared.f64 [r9+160], fd818;
st.shared.f64 [r9+168], fd828;
st.shared.f64 [r9+176], fd838;
st.shared.f64 [r9+184], fd848;
st.shared.f64 [r9+192], fd858;
barrier.sync 0;
ld.shared.f64 fd884, [r10];
ld.shared.f64 fd885, [r10+200];
ld.shared.f64 fd886, [r10+400];
ld.shared.f64 fd887, [r10+600];
ld.shared.f64 fd888, [r10+800];
ld.shared.f64 fd889, [r10+1000];
ld.shared.f64 fd890, [r10+1200];
ld.shared.f64 fd891, [r10+1400];
ld.shared.f64 fd892, [r10+1600];
ld.shared.f64 fd893, [r10+1800];
ld.shared.f64 fd894, [r10+2000];
ld.shared.f64 fd895, [r10+2200];
ld.shared.f64 fd896, [r10+2400];
ld.shared.f64 fd897, [r10+2600];
ld.shared.f64 fd898, [r10+2800];
ld.shared.f64 fd899, [r10+3000];
ld.shared.f64 fd900, [r10+3200];
ld.shared.f64 fd901, [r10+3400];
ld.shared.f64 fd902, [r10+3600];
ld.shared.f64 fd903, [r10+3800];
ld.shared.f64 fd904, [r10+4000];
ld.shared.f64 fd905, [r10+4200];
ld.shared.f64 fd906, [r10+4400];
ld.shared.f64 fd907, [r10+4600];
ld.shared.f64 fd908, [r10+4800];
add.f64 fd909, fd864, fd879;
add.f64 fd910, fd859, fd909;
add.f64 fd911, fd869, fd874;
add.f64 fd912, fd911, fd910;
add.f64 fd913, fd889, fd904;
add.f64 fd914, fd884, fd913;
add.f64 fd915, fd894, fd899;
add.f64 fd916, fd915, fd914;
fma.rn.f64 fd917, fd909, 0d3FD3C6EF372FE950, fd859;
mul.f64 fd918, fd911, 0d3FE9E3779B97F4A8;
sub.f64 fd919, fd917, fd918;
sub.f64 fd920, fd889, fd904;
mul.f64 fd921, fd920, 0d3FEE6F0E134454FF;
sub.f64 fd922, fd894, fd899;
mul.f64 fd923, fd922, 0dBFE2CF2304755A5E;
sub.f64 fd924, fd923, fd921;
sub.f64 fd925, fd919, fd924;
add.f64 fd926, fd924, fd919;
mul.f64 fd927, fd909, 0d3FE9E3779B97F4A8;
sub.f64 fd928, fd859, fd927;
fma.rn.f64 fd929, fd911, 0d3FD3C6EF372FE950, fd928;
mul.f64 fd930, fd920, 0d3FE2CF2304755A5E;
mul.f64 fd931, fd922, 0d3FEE6F0E134454FF;
sub.f64 fd932, fd931, fd930;
sub.f64 fd933, fd929, fd932;
add.f64 fd934, fd932, fd929;
fma.rn.f64 fd935, fd913, 0d3FD3C6EF372FE950, fd884;
mul.f64 fd936, fd915, 0d3FE9E3779B97F4A8;
sub.f64 fd937, fd935, fd936;
sub.f64 fd938, fd864, fd879;
mul.f64 fd939, fd938, 0d3FEE6F0E134454FF;
sub.f64 fd940, fd869, fd874;
mul.f64 fd941, fd940, 0dBFE2CF2304755A5E;
sub.f64 fd942, fd941, fd939;
add.f64 fd943, fd942, fd937;
sub.f64 fd944, fd937, fd942;
mul.f64 fd945, fd913, 0d3FE9E3779B97F4A8;
sub.f64 fd946, fd884, fd945;
fma.rn.f64 fd947, fd915, 0d3FD3C6EF372FE950, fd946;
mul.f64 fd948, fd938, 0d3FE2CF2304755A5E;
mul.f64 fd949, fd940, 0d3FEE6F0E134454FF;
sub.f64 fd950, fd949, fd948;
add.f64 fd951, fd950, fd947;
sub.f64 fd952, fd947, fd950;
add.f64 fd953, fd865, fd880;
add.f64 fd954, fd860, fd953;
add.f64 fd955, fd870, fd875;
add.f64 fd956, fd955, fd954;
add.f64 fd957, fd890, fd905;
add.f64 fd958, fd885, fd957;
add.f64 fd959, fd895, fd900;
add.f64 fd960, fd959, fd958;
fma.rn.f64 fd961, fd953, 0d3FD3C6EF372FE950, fd860;
mul.f64 fd962, fd955, 0d3FE9E3779B97F4A8;
sub.f64 fd963, fd961, fd962;
sub.f64 fd964, fd890, fd905;
mul.f64 fd965, fd964, 0d3FEE6F0E134454FF;
sub.f64 fd966, fd895, fd900;
mul.f64 fd967, fd966, 0dBFE2CF2304755A5E;
sub.f64 fd968, fd967, fd965;
sub.f64 fd969, fd963, fd968;
add.f64 fd970, fd968, fd963;
mul.f64 fd971, fd953, 0d3FE9E3779B97F4A8;
sub.f64 fd972, fd860, fd971;
fma.rn.f64 fd973, fd955, 0d3FD3C6EF372FE950, fd972;
mul.f64 fd974, fd964, 0d3FE2CF2304755A5E;
mul.f64 fd975, fd966, 0d3FEE6F0E134454FF;
sub.f64 fd976, fd975, fd974;
sub.f64 fd977, fd973, fd976;
add.f64 fd978, fd976, fd973;
fma.rn.f64 fd979, fd957, 0d3FD3C6EF372FE950, fd885;
mul.f64 fd980, fd959, 0d3FE9E3779B97F4A8;
sub.f64 fd981, fd979, fd980;
sub.f64 fd982, fd865, fd880;
mul.f64 fd983, fd982, 0d3FEE6F0E134454FF;
sub.f64 fd984, fd870, fd875;
mul.f64 fd985, fd984, 0dBFE2CF2304755A5E;
sub.f64 fd986, fd985, fd983;
add.f64 fd987, fd986, fd981;
sub.f64 fd988, fd981, fd986;
mul.f64 fd989, fd957, 0d3FE9E3779B97F4A8;
sub.f64 fd990, fd885, fd989;
fma.rn.f64 fd991, fd959, 0d3FD3C6EF372FE950, fd990;
mul.f64 fd992, fd982, 0d3FE2CF2304755A5E;
mul.f64 fd993, fd984, 0d3FEE6F0E134454FF;
sub.f64 fd994, fd993, fd992;
add.f64 fd995, fd994, fd991;
sub.f64 fd996, fd991, fd994;
add.f64 fd997, fd866, fd881;
add.f64 fd998, fd861, fd997;
add.f64 fd999, fd871, fd876;
add.f64 fd1000, fd999, fd998;
add.f64 fd1001, fd891, fd906;
add.f64 fd1002, fd886, fd1001;
add.f64 fd1003, fd896, fd901;
add.f64 fd1004, fd1003, fd1002;
fma.rn.f64 fd1005, fd997, 0d3FD3C6EF372FE950, fd861;
mul.f64 fd1006, fd999, 0d3FE9E3779B97F4A8;
sub.f64 fd1007, fd1005, fd1006;
sub.f64 fd1008, fd891, fd906;
mul.f64 fd1009, fd1008, 0d3FEE6F0E134454FF;
sub.f64 fd1010, fd896, fd901;
mul.f64 fd1011, fd1010, 0dBFE2CF2304755A5E;
sub.f64 fd1012, fd1011, fd1009;
sub.f64 fd1013, fd1007, fd1012;
add.f64 fd1014, fd1012, fd1007;
mul.f64 fd1015, fd997, 0d3FE9E3779B97F4A8;
sub.f64 fd1016, fd861, fd1015;
fma.rn.f64 fd1017, fd999, 0d3FD3C6EF372FE950, fd1016;
mul.f64 fd1018, fd1008, 0d3FE2CF2304755A5E;
mul.f64 fd1019, fd1010, 0d3FEE6F0E134454FF;
sub.f64 fd1020, fd1019, fd1018;
sub.f64 fd1021, fd1017, fd1020;
add.f64 fd1022, fd1020, fd1017;
fma.rn.f64 fd1023, fd1001, 0d3FD3C6EF372FE950, fd886;
mul.f64 fd1024, fd1003, 0d3FE9E3779B97F4A8;
sub.f64 fd1025, fd1023, fd1024;
sub.f64 fd1026, fd866, fd881;
mul.f64 fd1027, fd1026, 0d3FEE6F0E134454FF;
sub.f64 fd1028, fd871, fd876;
mul.f64 fd1029, fd1028, 0dBFE2CF2304755A5E;
sub.f64 fd1030, fd1029, fd1027;
add.f64 fd1031, fd1030, fd1025;
sub.f64 fd1032, fd1025, fd1030;
mul.f64 fd1033, fd1001, 0d3FE9E3779B97F4A8;
sub.f64 fd1034, fd886, fd1033;
fma.rn.f64 fd1035, fd1003, 0d3FD3C6EF372FE950, fd1034;
mul.f64 fd1036, fd1026, 0d3FE2CF2304755A5E;
mul.f64 fd1037, fd1028, 0d3FEE6F0E134454FF;
sub.f64 fd1038, fd1037, fd1036;
add.f64 fd1039, fd1038, fd1035;
sub.f64 fd1040, fd1035, fd1038;
add.f64 fd1041, fd867, fd882;
add.f64 fd1042, fd862, fd1041;
add.f64 fd1043, fd872, fd877;
add.f64 fd1044, fd1043, fd1042;
add.f64 fd1045, fd892, fd907;
add.f64 fd1046, fd887, fd1045;
add.f64 fd1047, fd897, fd902;
add.f64 fd1048, fd1047, fd1046;
fma.rn.f64 fd1049, fd1041, 0d3FD3C6EF372FE950, fd862;
mul.f64 fd1050, fd1043, 0d3FE9E3779B97F4A8;
sub.f64 fd1051, fd1049, fd1050;
sub.f64 fd1052, fd892, fd907;
mul.f64 fd1053, fd1052, 0d3FEE6F0E134454FF;
sub.f64 fd1054, fd897, fd902;
mul.f64 fd1055, fd1054, 0dBFE2CF2304755A5E;
sub.f64 fd1056, fd1055, fd1053;
sub.f64 fd1057, fd1051, fd1056;
add.f64 fd1058, fd1056, fd1051;
mul.f64 fd1059, fd1041, 0d3FE9E3779B97F4A8;
sub.f64 fd1060, fd862, fd1059;
fma.rn.f64 fd1061, fd1043, 0d3FD3C6EF372FE950, fd1060;
mul.f64 fd1062, fd1052, 0d3FE2CF2304755A5E;
mul.f64 fd1063, fd1054, 0d3FEE6F0E134454FF;
sub.f64 fd1064, fd1063, fd1062;
sub.f64 fd1065, fd1061, fd1064;
add.f64 fd1066, fd1064, fd1061;
fma.rn.f64 fd1067, fd1045, 0d3FD3C6EF372FE950, fd887;
mul.f64 fd1068, fd1047, 0d3FE9E3779B97F4A8;
sub.f64 fd1069, fd1067, fd1068;
sub.f64 fd1070, fd867, fd882;
mul.f64 fd1071, fd1070, 0d3FEE6F0E134454FF;
sub.f64 fd1072, fd872, fd877;
mul.f64 fd1073, fd1072, 0dBFE2CF2304755A5E;
sub.f64 fd1074, fd1073, fd1071;
add.f64 fd1075, fd1074, fd1069;
sub.f64 fd1076, fd1069, fd1074;
mul.f64 fd1077, fd1045, 0d3FE9E3779B97F4A8;
sub.f64 fd1078, fd887, fd1077;
fma.rn.f64 fd1079, fd1047, 0d3FD3C6EF372FE950, fd1078;
mul.f64 fd1080, fd1070, 0d3FE2CF2304755A5E;
mul.f64 fd1081, fd1072, 0d3FEE6F0E134454FF;
sub.f64 fd1082, fd1081, fd1080;
add.f64 fd1083, fd1082, fd1079;
sub.f64 fd1084, fd1079, fd1082;
add.f64 fd1085, fd868, fd883;
add.f64 fd1086, fd863, fd1085;
add.f64 fd1087, fd873, fd878;
add.f64 fd1088, fd1087, fd1086;
add.f64 fd1089, fd893, fd908;
add.f64 fd1090, fd888, fd1089;
add.f64 fd1091, fd898, fd903;
add.f64 fd1092, fd1091, fd1090;
fma.rn.f64 fd1093, fd1085, 0d3FD3C6EF372FE950, fd863;
mul.f64 fd1094, fd1087, 0d3FE9E3779B97F4A8;
sub.f64 fd1095, fd1093, fd1094;
sub.f64 fd1096, fd893, fd908;
mul.f64 fd1097, fd1096, 0d3FEE6F0E134454FF;
sub.f64 fd1098, fd898, fd903;
mul.f64 fd1099, fd1098, 0dBFE2CF2304755A5E;
sub.f64 fd1100, fd1099, fd1097;
sub.f64 fd1101, fd1095, fd1100;
add.f64 fd1102, fd1100, fd1095;
mul.f64 fd1103, fd1085, 0d3FE9E3779B97F4A8;
sub.f64 fd1104, fd863, fd1103;
fma.rn.f64 fd1105, fd1087, 0d3FD3C6EF372FE950, fd1104;
mul.f64 fd1106, fd1096, 0d3FE2CF2304755A5E;
mul.f64 fd1107, fd1098, 0d3FEE6F0E134454FF;
sub.f64 fd1108, fd1107, fd1106;
sub.f64 fd1109, fd1105, fd1108;
add.f64 fd1110, fd1108, fd1105;
fma.rn.f64 fd1111, fd1089, 0d3FD3C6EF372FE950, fd888;
mul.f64 fd1112, fd1091, 0d3FE9E3779B97F4A8;
sub.f64 fd1113, fd1111, fd1112;
sub.f64 fd1114, fd868, fd883;
mul.f64 fd1115, fd1114, 0d3FEE6F0E134454FF;
sub.f64 fd1116, fd873, fd878;
mul.f64 fd1117, fd1116, 0dBFE2CF2304755A5E;
sub.f64 fd1118, fd1117, fd1115;
add.f64 fd1119, fd1118, fd1113;
sub.f64 fd1120, fd1113, fd1118;
mul.f64 fd1121, fd1089, 0d3FE9E3779B97F4A8;
sub.f64 fd1122, fd888, fd1121;
fma.rn.f64 fd1123, fd1091, 0d3FD3C6EF372FE950, fd1122;
mul.f64 fd1124, fd1114, 0d3FE2CF2304755A5E;
mul.f64 fd1125, fd1116, 0d3FEE6F0E134454FF;
sub.f64 fd1126, fd1125, fd1124;
add.f64 fd1127, fd1126, fd1123;
sub.f64 fd1128, fd1123, fd1126;
mul.f64 fd1129, fd969, 0d3FEEFEA21D101EE0;
mul.f64 fd1130, fd987, 0dBFCFD511FA1C0796;
sub.f64 fd1131, fd1129, fd1130;
mul.f64 fd1132, fd987, 0d3FEEFEA21D101EE0;
fma.rn.f64 fd1133, fd969, 0dBFCFD511FA1C0796, fd1132;
mul.f64 fd1134, fd1013, 0d3FEC0AB44E81C059;
mul.f64 fd1135, fd1031, 0dBFDED50D5CBFA951;
sub.f64 fd1136, fd1134, fd1135;
mul.f64 fd1137, fd1031, 0d3FEC0AB44E81C059;
fma.rn.f64 fd1138, fd1013, 0dBFDED50D5CBFA951, fd1137;
mul.f64 fd1139, fd1057, 0d3FE753B603D2B816;
mul.f64 fd1140, fd1075, 0dBFE5E7CF55112014;
sub.f64 fd1141, fd1139, fd1140;
mul.f64 fd1142, fd1075, 0d3FE753B603D2B816;
fma.rn.f64 fd1143, fd1057, 0dBFE5E7CF55112014, fd1142;
mul.f64 fd1144, fd1101, 0d3FE1257E3C182B51;
mul.f64 fd1145, fd1119, 0dBFEB04BBFF642E86;
sub.f64 fd1146, fd1144, fd1145;
mul.f64 fd1147, fd1119, 0d3FE1257E3C182B51;
fma.rn.f64 fd1148, fd1101, 0dBFEB04BBFF642E86, fd1147;
mul.f64 fd1149, fd977, 0d3FEC0AB44E81C059;
mul.f64 fd1150, fd995, 0dBFDED50D5CBFA951;
sub.f64 fd1151, fd1149, fd1150;
mul.f64 fd1152, fd995, 0d3FEC0AB44E81C059;
fma.rn.f64 fd1153, fd977, 0dBFDED50D5CBFA951, fd1152;
mul.f64 fd1154, fd1021, 0d3FE1257E3C182B51;
mul.f64 fd1155, fd1039, 0dBFEB04BBFF642E86;
sub.f64 fd1156, fd1154, fd1155;
mul.f64 fd1157, fd1039, 0d3FE1257E3C182B51;
fma.rn.f64 fd1158, fd1021, 0dBFEB04BBFF642E86, fd1157;
mul.f64 fd1159, fd1065, 0d3FB0130A1BE09379;
mul.f64 fd1160, fd1083, 0dBFEFEFD5BFE443FE;
sub.f64 fd1161, fd1159, fd1160;
mul.f64 fd1162, fd1083, 0d3FB0130A1BE09379;
fma.rn.f64 fd1163, fd1065, 0dBFEFEFD5BFE443FE, fd1162;
mul.f64 fd1164, fd1109, 0dBFDB3FF7C925819C;
mul.f64 fd1165, fd1127, 0dBFECF457DCDC158C;
sub.f64 fd1166, fd1164, fd1165;
mul.f64 fd1167, fd1127, 0dBFDB3FF7C925819C;
fma.rn.f64 fd1168, fd1109, 0dBFECF457DCDC158C, fd1167;
mul.f64 fd1169, fd978, 0d3FE753B603D2B816;
mul.f64 fd1170, fd996, 0dBFE5E7CF55112014;
sub.f64 fd1171, fd1169, fd1170;
mul.f64 fd1172, fd996, 0d3FE753B603D2B816;
fma.rn.f64 fd1173, fd978, 0dBFE5E7CF55112014, fd1172;
mul.f64 fd1174, fd1022, 0d3FB0130A1BE09379;
mul.f64 fd1175, fd1040, 0dBFEFEFD5BFE443FE;
sub.f64 fd1176, fd1174, fd1175;
mul.f64 fd1177, fd1040, 0d3FB0130A1BE09379;
fma.rn.f64 fd1178, fd1022, 0dBFEFEFD5BFE443FE, fd1177;
mul.f64 fd1179, fd1066, 0dBFE465C6FEB501BC;
mul.f64 fd1180, fd1084, 0dBFE8A80B635B6BEA;
sub.f64 fd1181, fd1179, fd1180;
mul.f64 fd1182, fd1084, 0dBFE465C6FEB501BC;
fma.rn.f64 fd1183, fd1066, 0dBFE8A80B635B6BEA, fd1182;
mul.f64 fd1184, fd1110, 0dBFEFBF675480D903;
mul.f64 fd1185, fd1128, 0dBFC00AEB5DA15BE0;
sub.f64 fd1186, fd1184, fd1185;
mul.f64 fd1187, fd1128, 0dBFEFBF675480D903;
fma.rn.f64 fd1188, fd1110, 0dBFC00AEB5DA15BE0, fd1187;
mul.f64 fd1189, fd970, 0d3FE1257E3C182B51;
mul.f64 fd1190, fd988, 0dBFEB04BBFF642E86;
sub.f64 fd1191, fd1189, fd1190;
mul.f64 fd1192, fd988, 0d3FE1257E3C182B51;
fma.rn.f64 fd1193, fd970, 0dBFEB04BBFF642E86, fd1192;
mul.f64 fd1194, fd1014, 0dBFDB3FF7C925819C;
mul.f64 fd1195, fd1032, 0dBFECF457DCDC158C;
sub.f64 fd1196, fd1194, fd1195;
mul.f64 fd1197, fd1032, 0dBFDB3FF7C925819C;
fma.rn.f64 fd1198, fd1014, 0dBFECF457DCDC158C, fd1197;
mul.f64 fd1199, fd1058, 0dBFEFBF675480D903;
mul.f64 fd1200, fd1076, 0dBFC00AEB5DA15BE0;
sub.f64 fd1201, fd1199, fd1200;
mul.f64 fd1202, fd1076, 0dBFEFBF675480D903;
fma.rn.f64 fd1203, fd1058, 0dBFC00AEB5DA15BE0, fd1202;
mul.f64 fd1204, fd1102, 0dBFE465C6FEB501BC;
mul.f64 fd1205, fd1120, 0d3FE8A80B635B6BEA;
sub.f64 fd1206, fd1204, fd1205;
mul.f64 fd1207, fd1120, 0dBFE465C6FEB501BC;
fma.rn.f64 fd1208, fd1102, 0d3FE8A80B635B6BEA, fd1207;
add.f64 fd1209, fd956, fd1088;
add.f64 fd1210, fd912, fd1209;
add.f64 fd1211, fd1000, fd1044;
add.f64 fd1212, fd960, fd1092;
add.f64 fd1213, fd916, fd1212;
add.f64 fd1214, fd1004, fd1048;
fma.rn.f64 fd1215, fd1209, 0d3FD3C6EF372FE950, fd912;
mul.f64 fd1216, fd1211, 0d3FE9E3779B97F4A8;
sub.f64 fd1217, fd1215, fd1216;
sub.f64 fd1218, fd960, fd1092;
mul.f64 fd1219, fd1218, 0d3FEE6F0E134454FF;
sub.f64 fd1220, fd1004, fd1048;
mul.f64 fd1221, fd1220, 0dBFE2CF2304755A5E;
sub.f64 fd1222, fd1221, fd1219;
mul.f64 fd1223, fd1209, 0d3FE9E3779B97F4A8;
sub.f64 fd1224, fd912, fd1223;
fma.rn.f64 fd1225, fd1211, 0d3FD3C6EF372FE950, fd1224;
mul.f64 fd1226, fd1218, 0d3FE2CF2304755A5E;
mul.f64 fd1227, fd1220, 0d3FEE6F0E134454FF;
sub.f64 fd1228, fd1227, fd1226;
fma.rn.f64 fd1229, fd1212, 0d3FD3C6EF372FE950, fd916;
mul.f64 fd1230, fd1214, 0d3FE9E3779B97F4A8;
sub.f64 fd1231, fd1229, fd1230;
sub.f64 fd1232, fd956, fd1088;
mul.f64 fd1233, fd1232, 0d3FEE6F0E134454FF;
sub.f64 fd1234, fd1000, fd1044;
mul.f64 fd1235, fd1234, 0dBFE2CF2304755A5E;
sub.f64 fd1236, fd1235, fd1233;
mul.f64 fd1237, fd1212, 0d3FE9E3779B97F4A8;
sub.f64 fd1238, fd916, fd1237;
fma.rn.f64 fd1239, fd1214, 0d3FD3C6EF372FE950, fd1238;
mul.f64 fd1240, fd1232, 0d3FE2CF2304755A5E;
mul.f64 fd1241, fd1234, 0d3FEE6F0E134454FF;
sub.f64 fd1242, fd1241, fd1240;
add.f64 fd1243, fd1131, fd1146;
add.f64 fd1244, fd925, fd1243;
add.f64 fd1245, fd1136, fd1141;
add.f64 fd1246, fd1133, fd1148;
add.f64 fd1247, fd943, fd1246;
add.f64 fd1248, fd1138, fd1143;
fma.rn.f64 fd1249, fd1243, 0d3FD3C6EF372FE950, fd925;
mul.f64 fd1250, fd1245, 0d3FE9E3779B97F4A8;
sub.f64 fd1251, fd1249, fd1250;
sub.f64 fd1252, fd1133, fd1148;
mul.f64 fd1253, fd1252, 0d3FEE6F0E134454FF;
sub.f64 fd1254, fd1138, fd1143;
mul.f64 fd1255, fd1254, 0dBFE2CF2304755A5E;
sub.f64 fd1256, fd1255, fd1253;
mul.f64 fd1257, fd1243, 0d3FE9E3779B97F4A8;
sub.f64 fd1258, fd925, fd1257;
fma.rn.f64 fd1259, fd1245, 0d3FD3C6EF372FE950, fd1258;
mul.f64 fd1260, fd1252, 0d3FE2CF2304755A5E;
mul.f64 fd1261, fd1254, 0d3FEE6F0E134454FF;
sub.f64 fd1262, fd1261, fd1260;
fma.rn.f64 fd1263, fd1246, 0d3FD3C6EF372FE950, fd943;
mul.f64 fd1264, fd1248, 0d3FE9E3779B97F4A8;
sub.f64 fd1265, fd1263, fd1264;
sub.f64 fd1266, fd1131, fd1146;
mul.f64 fd1267, fd1266, 0d3FEE6F0E134454FF;
sub.f64 fd1268, fd1136, fd1141;
mul.f64 fd1269, fd1268, 0dBFE2CF2304755A5E;
sub.f64 fd1270, fd1269, fd1267;
mul.f64 fd1271, fd1246, 0d3FE9E3779B97F4A8;
sub.f64 fd1272, fd943, fd1271;
fma.rn.f64 fd1273, fd1248, 0d3FD3C6EF372FE950, fd1272;
mul.f64 fd1274, fd1266, 0d3FE2CF2304755A5E;
mul.f64 fd1275, fd1268, 0d3FEE6F0E134454FF;
sub.f64 fd1276, fd1275, fd1274;
add.f64 fd1277, fd1151, fd1166;
add.f64 fd1278, fd933, fd1277;
add.f64 fd1279, fd1156, fd1161;
add.f64 fd1280, fd1153, fd1168;
add.f64 fd1281, fd951, fd1280;
add.f64 fd1282, fd1158, fd1163;
fma.rn.f64 fd1283, fd1277, 0d3FD3C6EF372FE950, fd933;
mul.f64 fd1284, fd1279, 0d3FE9E3779B97F4A8;
sub.f64 fd1285, fd1283, fd1284;
sub.f64 fd1286, fd1153, fd1168;
mul.f64 fd1287, fd1286, 0d3FEE6F0E134454FF;
sub.f64 fd1288, fd1158, fd1163;
mul.f64 fd1289, fd1288, 0dBFE2CF2304755A5E;
sub.f64 fd1290, fd1289, fd1287;
mul.f64 fd1291, fd1277, 0d3FE9E3779B97F4A8;
sub.f64 fd1292, fd933, fd1291;
fma.rn.f64 fd1293, fd1279, 0d3FD3C6EF372FE950, fd1292;
mul.f64 fd1294, fd1286, 0d3FE2CF2304755A5E;
mul.f64 fd1295, fd1288, 0d3FEE6F0E134454FF;
sub.f64 fd1296, fd1295, fd1294;
fma.rn.f64 fd1297, fd1280, 0d3FD3C6EF372FE950, fd951;
mul.f64 fd1298, fd1282, 0d3FE9E3779B97F4A8;
sub.f64 fd1299, fd1297, fd1298;
sub.f64 fd1300, fd1151, fd1166;
mul.f64 fd1301, fd1300, 0d3FEE6F0E134454FF;
sub.f64 fd1302, fd1156, fd1161;
mul.f64 fd1303, fd1302, 0dBFE2CF2304755A5E;
sub.f64 fd1304, fd1303, fd1301;
mul.f64 fd1305, fd1280, 0d3FE9E3779B97F4A8;
sub.f64 fd1306, fd951, fd1305;
fma.rn.f64 fd1307, fd1282, 0d3FD3C6EF372FE950, fd1306;
mul.f64 fd1308, fd1300, 0d3FE2CF2304755A5E;
mul.f64 fd1309, fd1302, 0d3FEE6F0E134454FF;
sub.f64 fd1310, fd1309, fd1308;
add.f64 fd1311, fd1171, fd1186;
add.f64 fd1312, fd934, fd1311;
add.f64 fd1313, fd1176, fd1181;
add.f64 fd1314, fd1173, fd1188;
add.f64 fd1315, fd952, fd1314;
add.f64 fd1316, fd1178, fd1183;
fma.rn.f64 fd1317, fd1311, 0d3FD3C6EF372FE950, fd934;
mul.f64 fd1318, fd1313, 0d3FE9E3779B97F4A8;
sub.f64 fd1319, fd1317, fd1318;
sub.f64 fd1320, fd1173, fd1188;
mul.f64 fd1321, fd1320, 0d3FEE6F0E134454FF;
sub.f64 fd1322, fd1178, fd1183;
mul.f64 fd1323, fd1322, 0dBFE2CF2304755A5E;
sub.f64 fd1324, fd1323, fd1321;
mul.f64 fd1325, fd1311, 0d3FE9E3779B97F4A8;
sub.f64 fd1326, fd934, fd1325;
fma.rn.f64 fd1327, fd1313, 0d3FD3C6EF372FE950, fd1326;
mul.f64 fd1328, fd1320, 0d3FE2CF2304755A5E;
mul.f64 fd1329, fd1322, 0d3FEE6F0E134454FF;
sub.f64 fd1330, fd1329, fd1328;
fma.rn.f64 fd1331, fd1314, 0d3FD3C6EF372FE950, fd952;
mul.f64 fd1332, fd1316, 0d3FE9E3779B97F4A8;
sub.f64 fd1333, fd1331, fd1332;
sub.f64 fd1334, fd1171, fd1186;
mul.f64 fd1335, fd1334, 0d3FEE6F0E134454FF;
sub.f64 fd1336, fd1176, fd1181;
mul.f64 fd1337, fd1336, 0dBFE2CF2304755A5E;
sub.f64 fd1338, fd1337, fd1335;
mul.f64 fd1339, fd1314, 0d3FE9E3779B97F4A8;
sub.f64 fd1340, fd952, fd1339;
fma.rn.f64 fd1341, fd1316, 0d3FD3C6EF372FE950, fd1340;
mul.f64 fd1342, fd1334, 0d3FE2CF2304755A5E;
mul.f64 fd1343, fd1336, 0d3FEE6F0E134454FF;
sub.f64 fd1344, fd1343, fd1342;
add.f64 fd1345, fd1191, fd1206;
add.f64 fd1346, fd926, fd1345;
add.f64 fd1347, fd1196, fd1201;
add.f64 fd1348, fd1193, fd1208;
add.f64 fd1349, fd944, fd1348;
add.f64 fd1350, fd1198, fd1203;
fma.rn.f64 fd1351, fd1345, 0d3FD3C6EF372FE950, fd926;
mul.f64 fd1352, fd1347, 0d3FE9E3779B97F4A8;
sub.f64 fd1353, fd1351, fd1352;
sub.f64 fd1354, fd1193, fd1208;
mul.f64 fd1355, fd1354, 0d3FEE6F0E134454FF;
sub.f64 fd1356, fd1198, fd1203;
mul.f64 fd1357, fd1356, 0dBFE2CF2304755A5E;
sub.f64 fd1358, fd1357, fd1355;
mul.f64 fd1359, fd1345, 0d3FE9E3779B97F4A8;
sub.f64 fd1360, fd926, fd1359;
fma.rn.f64 fd1361, fd1347, 0d3FD3C6EF372FE950, fd1360;
mul.f64 fd1362, fd1354, 0d3FE2CF2304755A5E;
mul.f64 fd1363, fd1356, 0d3FEE6F0E134454FF;
sub.f64 fd1364, fd1363, fd1362;
fma.rn.f64 fd1365, fd1348, 0d3FD3C6EF372FE950, fd944;
mul.f64 fd1366, fd1350, 0d3FE9E3779B97F4A8;
sub.f64 fd1367, fd1365, fd1366;
sub.f64 fd1368, fd1191, fd1206;
mul.f64 fd1369, fd1368, 0d3FEE6F0E134454FF;
sub.f64 fd1370, fd1196, fd1201;
mul.f64 fd1371, fd1370, 0dBFE2CF2304755A5E;
sub.f64 fd1372, fd1371, fd1369;
mul.f64 fd1373, fd1348, 0d3FE9E3779B97F4A8;
sub.f64 fd1374, fd944, fd1373;
fma.rn.f64 fd1375, fd1350, 0d3FD3C6EF372FE950, fd1374;
mul.f64 fd1376, fd1368, 0d3FE2CF2304755A5E;
mul.f64 fd1377, fd1370, 0d3FEE6F0E134454FF;
sub.f64 fd1378, fd1377, fd1376;
add.f64 %0, fd1211, fd1210;
add.f64 %1, fd1214, fd1213;
add.f64 %3, fd1248, fd1247;
add.f64 %2, fd1245, fd1244;
add.f64 %5, fd1282, fd1281;
add.f64 %4, fd1279, fd1278;
add.f64 %7, fd1316, fd1315;
add.f64 %6, fd1313, fd1312;
add.f64 %9, fd1350, fd1349;
add.f64 %8, fd1347, fd1346;
add.f64 %11, fd1236, fd1231;
sub.f64 %10, fd1217, fd1222;
add.f64 %13, fd1270, fd1265;
sub.f64 %12, fd1251, fd1256;
add.f64 %15, fd1304, fd1299;
sub.f64 %14, fd1285, fd1290;
add.f64 %17, fd1338, fd1333;
sub.f64 %16, fd1319, fd1324;
add.f64 %19, fd1372, fd1367;
sub.f64 %18, fd1353, fd1358;
sub.f64 %20, fd1225, fd1228;
add.f64 %21, fd1242, fd1239;
add.f64 %23, fd1276, fd1273;
sub.f64 %22, fd1259, fd1262;
add.f64 %25, fd1310, fd1307;
sub.f64 %24, fd1293, fd1296;
add.f64 %27, fd1344, fd1341;
sub.f64 %26, fd1327, fd1330;
add.f64 %29, fd1378, fd1375;
sub.f64 %28, fd1361, fd1364;
add.f64 %30, fd1228, fd1225;
sub.f64 %31, fd1239, fd1242;
sub.f64 %33, fd1273, fd1276;
add.f64 %32, fd1262, fd1259;
sub.f64 %35, fd1307, fd1310;
add.f64 %34, fd1296, fd1293;
sub.f64 %37, fd1341, fd1344;
add.f64 %36, fd1330, fd1327;
sub.f64 %39, fd1375, fd1378;
add.f64 %38, fd1364, fd1361;
sub.f64 %41, fd1231, fd1236;
add.f64 %40, fd1222, fd1217;
sub.f64 %43, fd1265, fd1270;
add.f64 %42, fd1256, fd1251;
sub.f64 %45, fd1299, fd1304;
add.f64 %44, fd1290, fd1285;
sub.f64 %47, fd1333, fd1338;
add.f64 %46, fd1324, fd1319;
sub.f64 %49, fd1367, fd1372;
add.f64 %48, fd1358, fd1353;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y), "=d"(rmem[9].x), "=d"(rmem[9].y), "=d"(rmem[10].x), "=d"(rmem[10].y), "=d"(rmem[11].x), "=d"(rmem[11].y), "=d"(rmem[12].x), "=d"(rmem[12].y), "=d"(rmem[13].x), "=d"(rmem[13].y), "=d"(rmem[14].x), "=d"(rmem[14].y), "=d"(rmem[15].x), "=d"(rmem[15].y), "=d"(rmem[16].x), "=d"(rmem[16].y), "=d"(rmem[17].x), "=d"(rmem[17].y), "=d"(rmem[18].x), "=d"(rmem[18].y), "=d"(rmem[19].x), "=d"(rmem[19].y), "=d"(rmem[20].x), "=d"(rmem[20].y), "=d"(rmem[21].x), "=d"(rmem[21].y), "=d"(rmem[22].x), "=d"(rmem[22].y), "=d"(rmem[23].x), "=d"(rmem[23].y), "=d"(rmem[24].x), "=d"(rmem[24].y): "r"(smem), "l"(lut_dp_25_625), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y), "d"(rmem[8].y), "d"(rmem[9].x), "d"(rmem[9].y), "d"(rmem[10].x), "d"(rmem[10].y), "d"(rmem[10].y), "d"(rmem[11].x), "d"(rmem[11].y), "d"(rmem[11].y), "d"(rmem[12].x), "d"(rmem[12].y), "d"(rmem[13].x), "d"(rmem[13].y), "d"(rmem[13].y), "d"(rmem[14].x), "d"(rmem[14].y), "d"(rmem[14].y), "d"(rmem[15].x), "d"(rmem[15].y), "d"(rmem[16].x), "d"(rmem[16].y), "d"(rmem[16].y), "d"(rmem[17].x), "d"(rmem[17].y), "d"(rmem[17].y), "d"(rmem[18].x), "d"(rmem[18].y), "d"(rmem[19].x), "d"(rmem[19].y), "d"(rmem[19].y), "d"(rmem[20].x), "d"(rmem[20].y), "d"(rmem[20].y), "d"(rmem[21].x), "d"(rmem[21].y), "d"(rmem[22].x), "d"(rmem[22].y), "d"(rmem[22].y), "d"(rmem[23].x), "d"(rmem[23].y), "d"(rmem[23].y), "d"(rmem[24].x), 
"d"(rmem[24].y));
};




template<> __forceinline__ __device__ void cufftdx_private_function<543, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<14>;
.reg .f64 fd<1788>;
.reg .b64 rd<10>;
mov.u32 r12, %tid.y;
mov.u32 r13, %50;
mad.lo.s32 r3, r12, 10000, r13;
add.f64 fd101, %62, %92;
add.f64 fd103, %72, %82;
add.f64 fd1787, %52, fd101;
add.f64 fd104, fd103, fd1787;
add.f64 fd105, %102, %104;
add.f64 fd107, %103, %83;
add.f64 fd1783, %53, fd105;
add.f64 fd108, fd107, fd1783;
mul.f64 fd110, fd103, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1782, fd101, 0d3FD3C6EF372FE950, %52;
sub.f64 fd111, fd1782, fd110;
sub.f64 fd112, %102, %104;
sub.f64 fd114, %103, %83;
mul.f64 fd1780, fd112, 0d3FEE6F0E134454FF;
mul.f64 fd1781, fd114, 0dBFE2CF2304755A5E;
sub.f64 fd116, fd1781, fd1780;
sub.f64 fd117, fd111, fd116;
add.f64 fd118, fd116, fd111;
mul.f64 fd119, fd101, 0d3FE9E3779B97F4A8;
sub.f64 fd120, %52, fd119;
fma.rn.f64 fd121, fd103, 0d3FD3C6EF372FE950, fd120;
mul.f64 fd122, fd112, 0d3FE2CF2304755A5E;
mul.f64 fd123, fd114, 0d3FEE6F0E134454FF;
sub.f64 fd124, fd123, fd122;
sub.f64 fd125, fd121, fd124;
add.f64 fd126, fd124, fd121;
fma.rn.f64 fd1778, fd105, 0d3FD3C6EF372FE950, %53;
mul.f64 fd1779, fd107, 0d3FE9E3779B97F4A8;
sub.f64 fd129, fd1778, fd1779;
sub.f64 fd130, %62, %92;
sub.f64 fd132, %72, %82;
mul.f64 fd1776, fd130, 0d3FEE6F0E134454FF;
mul.f64 fd1777, fd132, 0dBFE2CF2304755A5E;
sub.f64 fd134, fd1777, fd1776;
add.f64 fd135, fd134, fd129;
sub.f64 fd136, fd129, fd134;
mul.f64 fd137, fd105, 0d3FE9E3779B97F4A8;
sub.f64 fd138, %53, fd137;
fma.rn.f64 fd139, fd107, 0d3FD3C6EF372FE950, fd138;
mul.f64 fd140, fd130, 0d3FE2CF2304755A5E;
mul.f64 fd141, fd132, 0d3FEE6F0E134454FF;
sub.f64 fd142, fd141, fd140;
add.f64 fd143, fd142, fd139;
sub.f64 fd144, fd139, fd142;
add.f64 fd145, %64, %94;
add.f64 fd147, %74, %84;
add.f64 fd1775, %54, fd145;
add.f64 fd148, fd147, fd1775;
add.f64 fd149, %65, %95;
add.f64 fd151, %107, %105;
add.f64 fd1771, %106, fd149;
add.f64 fd152, fd151, fd1771;
fma.rn.f64 fd1769, fd145, 0d3FD3C6EF372FE950, %54;
mul.f64 fd1770, fd147, 0d3FE9E3779B97F4A8;
sub.f64 fd155, fd1769, fd1770;
sub.f64 fd156, %65, %95;
sub.f64 fd158, %107, %105;
mul.f64 fd1767, fd156, 0d3FEE6F0E134454FF;
mul.f64 fd1768, fd158, 0dBFE2CF2304755A5E;
sub.f64 fd160, fd1768, fd1767;
sub.f64 fd161, fd155, fd160;
add.f64 fd162, fd160, fd155;
mul.f64 fd163, fd145, 0d3FE9E3779B97F4A8;
sub.f64 fd164, %54, fd163;
fma.rn.f64 fd165, fd147, 0d3FD3C6EF372FE950, fd164;
mul.f64 fd166, fd156, 0d3FE2CF2304755A5E;
mul.f64 fd167, fd158, 0d3FEE6F0E134454FF;
sub.f64 fd168, fd167, fd166;
sub.f64 fd169, fd165, fd168;
add.f64 fd170, fd168, fd165;
mul.f64 fd172, fd151, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1766, fd149, 0d3FD3C6EF372FE950, %106;
sub.f64 fd173, fd1766, fd172;
sub.f64 fd174, %64, %94;
sub.f64 fd176, %74, %84;
mul.f64 fd177, fd176, 0dBFE2CF2304755A5E;
mul.f64 fd1765, fd174, 0d3FEE6F0E134454FF;
sub.f64 fd178, fd177, fd1765;
add.f64 fd179, fd178, fd173;
sub.f64 fd180, fd173, fd178;
mul.f64 fd181, fd149, 0d3FE9E3779B97F4A8;
sub.f64 fd182, %106, fd181;
fma.rn.f64 fd183, fd151, 0d3FD3C6EF372FE950, fd182;
mul.f64 fd184, fd174, 0d3FE2CF2304755A5E;
mul.f64 fd185, fd176, 0d3FEE6F0E134454FF;
sub.f64 fd186, fd185, fd184;
add.f64 fd187, fd186, fd183;
sub.f64 fd188, fd183, fd186;
add.f64 fd189, %66, %96;
add.f64 fd191, %76, %86;
add.f64 fd1764, %56, fd189;
add.f64 fd192, fd191, fd1764;
add.f64 fd193, %110, %109;
add.f64 fd195, %77, %111;
add.f64 fd1759, %108, fd193;
add.f64 fd196, fd195, fd1759;
mul.f64 fd198, fd191, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1758, fd189, 0d3FD3C6EF372FE950, %56;
sub.f64 fd199, fd1758, fd198;
sub.f64 fd200, %110, %109;
sub.f64 fd202, %77, %111;
mul.f64 fd203, fd202, 0dBFE2CF2304755A5E;
mul.f64 fd1757, fd200, 0d3FEE6F0E134454FF;
sub.f64 fd204, fd203, fd1757;
sub.f64 fd205, fd199, fd204;
add.f64 fd206, fd204, fd199;
mul.f64 fd207, fd189, 0d3FE9E3779B97F4A8;
sub.f64 fd208, %56, fd207;
fma.rn.f64 fd209, fd191, 0d3FD3C6EF372FE950, fd208;
mul.f64 fd210, fd200, 0d3FE2CF2304755A5E;
mul.f64 fd211, fd202, 0d3FEE6F0E134454FF;
sub.f64 fd212, fd211, fd210;
sub.f64 fd213, fd209, fd212;
add.f64 fd214, fd212, fd209;
fma.rn.f64 fd1755, fd193, 0d3FD3C6EF372FE950, %108;
mul.f64 fd1756, fd195, 0d3FE9E3779B97F4A8;
sub.f64 fd217, fd1755, fd1756;
sub.f64 fd218, %66, %96;
sub.f64 fd220, %76, %86;
mul.f64 fd1753, fd218, 0d3FEE6F0E134454FF;
mul.f64 fd1754, fd220, 0dBFE2CF2304755A5E;
sub.f64 fd222, fd1754, fd1753;
add.f64 fd223, fd222, fd217;
sub.f64 fd224, fd217, fd222;
mul.f64 fd225, fd193, 0d3FE9E3779B97F4A8;
sub.f64 fd226, %108, fd225;
fma.rn.f64 fd227, fd195, 0d3FD3C6EF372FE950, fd226;
mul.f64 fd228, fd218, 0d3FE2CF2304755A5E;
mul.f64 fd229, fd220, 0d3FEE6F0E134454FF;
sub.f64 fd230, fd229, fd228;
add.f64 fd231, fd230, fd227;
sub.f64 fd232, fd227, fd230;
add.f64 fd233, %68, %98;
add.f64 fd235, %78, %88;
add.f64 fd1752, %58, fd233;
add.f64 fd236, fd235, fd1752;
add.f64 fd237, %113, %112;
add.f64 fd239, %114, %89;
add.f64 fd1748, %59, fd237;
add.f64 fd240, fd239, fd1748;
fma.rn.f64 fd1746, fd233, 0d3FD3C6EF372FE950, %58;
mul.f64 fd1747, fd235, 0d3FE9E3779B97F4A8;
sub.f64 fd243, fd1746, fd1747;
sub.f64 fd244, %113, %112;
sub.f64 fd246, %114, %89;
mul.f64 fd1744, fd244, 0d3FEE6F0E134454FF;
mul.f64 fd1745, fd246, 0dBFE2CF2304755A5E;
sub.f64 fd248, fd1745, fd1744;
sub.f64 fd249, fd243, fd248;
add.f64 fd250, fd248, fd243;
mul.f64 fd251, fd233, 0d3FE9E3779B97F4A8;
sub.f64 fd252, %58, fd251;
fma.rn.f64 fd253, fd235, 0d3FD3C6EF372FE950, fd252;
mul.f64 fd254, fd244, 0d3FE2CF2304755A5E;
mul.f64 fd255, fd246, 0d3FEE6F0E134454FF;
sub.f64 fd256, fd255, fd254;
sub.f64 fd257, fd253, fd256;
add.f64 fd258, fd256, fd253;
mul.f64 fd260, fd239, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1743, fd237, 0d3FD3C6EF372FE950, %59;
sub.f64 fd261, fd1743, fd260;
sub.f64 fd262, %68, %98;
sub.f64 fd264, %78, %88;
mul.f64 fd1741, fd262, 0d3FEE6F0E134454FF;
mul.f64 fd1742, fd264, 0dBFE2CF2304755A5E;
sub.f64 fd266, fd1742, fd1741;
add.f64 fd267, fd266, fd261;
sub.f64 fd268, fd261, fd266;
mul.f64 fd269, fd237, 0d3FE9E3779B97F4A8;
sub.f64 fd270, %59, fd269;
fma.rn.f64 fd271, fd239, 0d3FD3C6EF372FE950, fd270;
mul.f64 fd272, fd262, 0d3FE2CF2304755A5E;
mul.f64 fd273, fd264, 0d3FEE6F0E134454FF;
sub.f64 fd274, fd273, fd272;
add.f64 fd275, fd274, fd271;
sub.f64 fd276, fd271, fd274;
add.f64 fd277, %70, %100;
add.f64 fd279, %80, %90;
add.f64 fd1740, %60, fd277;
add.f64 fd280, fd279, fd1740;
add.f64 fd281, %71, %101;
add.f64 fd283, %117, %115;
add.f64 fd1736, %116, fd281;
add.f64 fd284, fd283, fd1736;
mul.f64 fd286, fd279, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1735, fd277, 0d3FD3C6EF372FE950, %60;
sub.f64 fd287, fd1735, fd286;
sub.f64 fd288, %71, %101;
sub.f64 fd290, %117, %115;
mul.f64 fd1733, fd288, 0d3FEE6F0E134454FF;
mul.f64 fd1734, fd290, 0dBFE2CF2304755A5E;
sub.f64 fd292, fd1734, fd1733;
sub.f64 fd293, fd287, fd292;
add.f64 fd294, fd292, fd287;
mul.f64 fd295, fd277, 0d3FE9E3779B97F4A8;
sub.f64 fd296, %60, fd295;
fma.rn.f64 fd297, fd279, 0d3FD3C6EF372FE950, fd296;
mul.f64 fd298, fd288, 0d3FE2CF2304755A5E;
mul.f64 fd299, fd290, 0d3FEE6F0E134454FF;
sub.f64 fd300, fd299, fd298;
sub.f64 fd301, fd297, fd300;
add.f64 fd302, fd300, fd297;
mul.f64 fd304, fd283, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1732, fd281, 0d3FD3C6EF372FE950, %116;
sub.f64 fd305, fd1732, fd304;
sub.f64 fd306, %70, %100;
sub.f64 fd308, %80, %90;
mul.f64 fd1730, fd306, 0d3FEE6F0E134454FF;
mul.f64 fd1731, fd308, 0dBFE2CF2304755A5E;
sub.f64 fd310, fd1731, fd1730;
add.f64 fd311, fd310, fd305;
sub.f64 fd312, fd305, fd310;
mul.f64 fd313, fd281, 0d3FE9E3779B97F4A8;
sub.f64 fd314, %116, fd313;
fma.rn.f64 fd315, fd283, 0d3FD3C6EF372FE950, fd314;
mul.f64 fd316, fd306, 0d3FE2CF2304755A5E;
mul.f64 fd317, fd308, 0d3FEE6F0E134454FF;
sub.f64 fd318, fd317, fd316;
add.f64 fd319, fd318, fd315;
sub.f64 fd320, fd315, fd318;
mul.f64 fd322, fd179, 0dBFCFD511FA1C0796;
mul.f64 fd1729, fd161, 0d3FEEFEA21D101EE0;
sub.f64 fd323, fd1729, fd322;
mul.f64 fd324, fd179, 0d3FEEFEA21D101EE0;
fma.rn.f64 fd325, fd161, 0dBFCFD511FA1C0796, fd324;
mul.f64 fd327, fd223, 0dBFDED50D5CBFA951;
mul.f64 fd1728, fd205, 0d3FEC0AB44E81C059;
sub.f64 fd328, fd1728, fd327;
mul.f64 fd329, fd223, 0d3FEC0AB44E81C059;
fma.rn.f64 fd330, fd205, 0dBFDED50D5CBFA951, fd329;
mul.f64 fd332, fd267, 0dBFE5E7CF55112014;
mul.f64 fd1727, fd249, 0d3FE753B603D2B816;
sub.f64 fd333, fd1727, fd332;
mul.f64 fd334, fd267, 0d3FE753B603D2B816;
fma.rn.f64 fd335, fd249, 0dBFE5E7CF55112014, fd334;
mul.f64 fd337, fd311, 0dBFEB04BBFF642E86;
mul.f64 fd1726, fd293, 0d3FE1257E3C182B51;
sub.f64 fd338, fd1726, fd337;
mul.f64 fd339, fd311, 0d3FE1257E3C182B51;
fma.rn.f64 fd340, fd293, 0dBFEB04BBFF642E86, fd339;
mul.f64 fd342, fd187, 0dBFDED50D5CBFA951;
mul.f64 fd1725, fd169, 0d3FEC0AB44E81C059;
sub.f64 fd343, fd1725, fd342;
mul.f64 fd344, fd187, 0d3FEC0AB44E81C059;
fma.rn.f64 fd345, fd169, 0dBFDED50D5CBFA951, fd344;
mul.f64 fd1723, fd213, 0d3FE1257E3C182B51;
mul.f64 fd1724, fd231, 0dBFEB04BBFF642E86;
sub.f64 fd348, fd1723, fd1724;
mul.f64 fd349, fd231, 0d3FE1257E3C182B51;
fma.rn.f64 fd350, fd213, 0dBFEB04BBFF642E86, fd349;
mul.f64 fd1721, fd257, 0d3FB0130A1BE09379;
mul.f64 fd1722, fd275, 0dBFEFEFD5BFE443FE;
sub.f64 fd353, fd1721, fd1722;
mul.f64 fd354, fd275, 0d3FB0130A1BE09379;
fma.rn.f64 fd355, fd257, 0dBFEFEFD5BFE443FE, fd354;
mul.f64 fd1719, fd301, 0dBFDB3FF7C925819C;
mul.f64 fd1720, fd319, 0dBFECF457DCDC158C;
sub.f64 fd358, fd1719, fd1720;
mul.f64 fd359, fd319, 0dBFDB3FF7C925819C;
fma.rn.f64 fd360, fd301, 0dBFECF457DCDC158C, fd359;
mul.f64 fd1717, fd170, 0d3FE753B603D2B816;
mul.f64 fd1718, fd188, 0dBFE5E7CF55112014;
sub.f64 fd363, fd1717, fd1718;
mul.f64 fd364, fd188, 0d3FE753B603D2B816;
fma.rn.f64 fd365, fd170, 0dBFE5E7CF55112014, fd364;
mul.f64 fd367, fd232, 0dBFEFEFD5BFE443FE;
mul.f64 fd1716, fd214, 0d3FB0130A1BE09379;
sub.f64 fd368, fd1716, fd367;
mul.f64 fd369, fd232, 0d3FB0130A1BE09379;
fma.rn.f64 fd370, fd214, 0dBFEFEFD5BFE443FE, fd369;
mul.f64 fd372, fd276, 0dBFE8A80B635B6BEA;
mul.f64 fd1715, fd258, 0dBFE465C6FEB501BC;
sub.f64 fd373, fd1715, fd372;
mul.f64 fd374, fd276, 0dBFE465C6FEB501BC;
fma.rn.f64 fd375, fd258, 0dBFE8A80B635B6BEA, fd374;
mul.f64 fd377, fd320, 0dBFC00AEB5DA15BE0;
mul.f64 fd1714, fd302, 0dBFEFBF675480D903;
sub.f64 fd378, fd1714, fd377;
mul.f64 fd379, fd320, 0dBFEFBF675480D903;
fma.rn.f64 fd380, fd302, 0dBFC00AEB5DA15BE0, fd379;
mul.f64 fd382, fd180, 0dBFEB04BBFF642E86;
mul.f64 fd1713, fd162, 0d3FE1257E3C182B51;
sub.f64 fd383, fd1713, fd382;
mul.f64 fd384, fd180, 0d3FE1257E3C182B51;
fma.rn.f64 fd385, fd162, 0dBFEB04BBFF642E86, fd384;
mul.f64 fd387, fd224, 0dBFECF457DCDC158C;
mul.f64 fd1712, fd206, 0dBFDB3FF7C925819C;
sub.f64 fd388, fd1712, fd387;
mul.f64 fd389, fd224, 0dBFDB3FF7C925819C;
fma.rn.f64 fd390, fd206, 0dBFECF457DCDC158C, fd389;
mul.f64 fd1710, fd250, 0dBFEFBF675480D903;
mul.f64 fd1711, fd268, 0dBFC00AEB5DA15BE0;
sub.f64 fd393, fd1710, fd1711;
mul.f64 fd394, fd268, 0dBFEFBF675480D903;
fma.rn.f64 fd395, fd250, 0dBFC00AEB5DA15BE0, fd394;
mul.f64 fd1708, fd294, 0dBFE465C6FEB501BC;
mul.f64 fd1709, fd312, 0d3FE8A80B635B6BEA;
sub.f64 fd398, fd1708, fd1709;
mul.f64 fd399, fd312, 0dBFE465C6FEB501BC;
fma.rn.f64 fd400, fd294, 0d3FE8A80B635B6BEA, fd399;
add.f64 fd401, fd148, fd280;
add.f64 fd403, fd192, fd236;
mul.f64 fd408, fd403, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1707, fd401, 0d3FD3C6EF372FE950, fd104;
sub.f64 fd409, fd1707, fd408;
add.f64 fd1706, fd152, fd284;
sub.f64 fd410, fd152, fd284;
add.f64 fd1705, fd196, fd240;
sub.f64 fd412, fd196, fd240;
mul.f64 fd413, fd412, 0dBFE2CF2304755A5E;
mul.f64 fd1704, fd410, 0d3FEE6F0E134454FF;
sub.f64 fd414, fd413, fd1704;
sub.f64 fd415, fd409, fd414;
add.f64 fd416, fd414, fd409;
add.f64 fd1703, fd104, fd401;
mul.f64 fd417, fd401, 0d3FE9E3779B97F4A8;
sub.f64 fd418, fd104, fd417;
fma.rn.f64 fd419, fd403, 0d3FD3C6EF372FE950, fd418;
mul.f64 fd420, fd410, 0d3FE2CF2304755A5E;
mul.f64 fd421, fd412, 0d3FEE6F0E134454FF;
sub.f64 fd422, fd421, fd420;
sub.f64 fd423, fd419, fd422;
add.f64 fd424, fd422, fd419;
fma.rn.f64 fd1701, fd1706, 0d3FD3C6EF372FE950, fd108;
mul.f64 fd1702, fd1705, 0d3FE9E3779B97F4A8;
sub.f64 fd427, fd1701, fd1702;
sub.f64 fd428, fd148, fd280;
sub.f64 fd430, fd192, fd236;
mul.f64 fd1699, fd428, 0d3FEE6F0E134454FF;
mul.f64 fd1700, fd430, 0dBFE2CF2304755A5E;
sub.f64 fd432, fd1700, fd1699;
add.f64 fd433, fd432, fd427;
sub.f64 fd434, fd427, fd432;
add.f64 fd1698, fd108, fd1706;
mul.f64 fd435, fd1706, 0d3FE9E3779B97F4A8;
sub.f64 fd436, fd108, fd435;
fma.rn.f64 fd437, fd1705, 0d3FD3C6EF372FE950, fd436;
mul.f64 fd438, fd428, 0d3FE2CF2304755A5E;
mul.f64 fd439, fd430, 0d3FEE6F0E134454FF;
sub.f64 fd440, fd439, fd438;
add.f64 fd441, fd440, fd437;
sub.f64 fd442, fd437, fd440;
add.f64 fd443, fd323, fd338;
add.f64 fd445, fd328, fd333;
add.f64 fd1697, fd117, fd443;
add.f64 fd446, fd445, fd1697;
add.f64 fd447, fd325, fd340;
add.f64 fd449, fd330, fd335;
add.f64 fd1696, fd135, fd447;
add.f64 fd450, fd449, fd1696;
fma.rn.f64 fd1694, fd443, 0d3FD3C6EF372FE950, fd117;
mul.f64 fd1695, fd445, 0d3FE9E3779B97F4A8;
sub.f64 fd453, fd1694, fd1695;
sub.f64 fd454, fd325, fd340;
sub.f64 fd456, fd330, fd335;
mul.f64 fd1692, fd454, 0d3FEE6F0E134454FF;
mul.f64 fd1693, fd456, 0dBFE2CF2304755A5E;
sub.f64 fd458, fd1693, fd1692;
sub.f64 fd459, fd453, fd458;
add.f64 fd460, fd458, fd453;
mul.f64 fd461, fd443, 0d3FE9E3779B97F4A8;
sub.f64 fd462, fd117, fd461;
fma.rn.f64 fd463, fd445, 0d3FD3C6EF372FE950, fd462;
mul.f64 fd464, fd454, 0d3FE2CF2304755A5E;
mul.f64 fd465, fd456, 0d3FEE6F0E134454FF;
sub.f64 fd466, fd465, fd464;
sub.f64 fd467, fd463, fd466;
add.f64 fd468, fd466, fd463;
mul.f64 fd470, fd449, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1691, fd447, 0d3FD3C6EF372FE950, fd135;
sub.f64 fd471, fd1691, fd470;
sub.f64 fd472, fd323, fd338;
sub.f64 fd474, fd328, fd333;
mul.f64 fd1689, fd472, 0d3FEE6F0E134454FF;
mul.f64 fd1690, fd474, 0dBFE2CF2304755A5E;
sub.f64 fd476, fd1690, fd1689;
add.f64 fd477, fd476, fd471;
sub.f64 fd478, fd471, fd476;
mul.f64 fd479, fd447, 0d3FE9E3779B97F4A8;
sub.f64 fd480, fd135, fd479;
fma.rn.f64 fd481, fd449, 0d3FD3C6EF372FE950, fd480;
mul.f64 fd482, fd472, 0d3FE2CF2304755A5E;
mul.f64 fd483, fd474, 0d3FEE6F0E134454FF;
sub.f64 fd484, fd483, fd482;
add.f64 fd485, fd484, fd481;
sub.f64 fd486, fd481, fd484;
add.f64 fd487, fd343, fd358;
add.f64 fd489, fd348, fd353;
add.f64 fd1688, fd125, fd487;
add.f64 fd490, fd489, fd1688;
add.f64 fd491, fd345, fd360;
add.f64 fd493, fd350, fd355;
add.f64 fd1687, fd143, fd491;
add.f64 fd494, fd493, fd1687;
mul.f64 fd496, fd489, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1686, fd487, 0d3FD3C6EF372FE950, fd125;
sub.f64 fd497, fd1686, fd496;
sub.f64 fd498, fd345, fd360;
sub.f64 fd500, fd350, fd355;
mul.f64 fd1684, fd498, 0d3FEE6F0E134454FF;
mul.f64 fd1685, fd500, 0dBFE2CF2304755A5E;
sub.f64 fd502, fd1685, fd1684;
sub.f64 fd503, fd497, fd502;
add.f64 fd504, fd502, fd497;
mul.f64 fd505, fd487, 0d3FE9E3779B97F4A8;
sub.f64 fd506, fd125, fd505;
fma.rn.f64 fd507, fd489, 0d3FD3C6EF372FE950, fd506;
mul.f64 fd508, fd498, 0d3FE2CF2304755A5E;
mul.f64 fd509, fd500, 0d3FEE6F0E134454FF;
sub.f64 fd510, fd509, fd508;
sub.f64 fd511, fd507, fd510;
add.f64 fd512, fd510, fd507;
mul.f64 fd514, fd493, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1683, fd491, 0d3FD3C6EF372FE950, fd143;
sub.f64 fd515, fd1683, fd514;
sub.f64 fd516, fd343, fd358;
sub.f64 fd518, fd348, fd353;
mul.f64 fd1681, fd516, 0d3FEE6F0E134454FF;
mul.f64 fd1682, fd518, 0dBFE2CF2304755A5E;
sub.f64 fd520, fd1682, fd1681;
add.f64 fd521, fd520, fd515;
sub.f64 fd522, fd515, fd520;
mul.f64 fd523, fd491, 0d3FE9E3779B97F4A8;
sub.f64 fd524, fd143, fd523;
fma.rn.f64 fd525, fd493, 0d3FD3C6EF372FE950, fd524;
mul.f64 fd526, fd516, 0d3FE2CF2304755A5E;
mul.f64 fd527, fd518, 0d3FEE6F0E134454FF;
sub.f64 fd528, fd527, fd526;
add.f64 fd529, fd528, fd525;
sub.f64 fd530, fd525, fd528;
add.f64 fd531, fd363, fd378;
add.f64 fd533, fd368, fd373;
add.f64 fd1680, fd126, fd531;
add.f64 fd534, fd533, fd1680;
add.f64 fd535, fd365, fd380;
add.f64 fd537, fd370, fd375;
add.f64 fd1679, fd144, fd535;
add.f64 fd538, fd537, fd1679;
mul.f64 fd540, fd533, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1678, fd531, 0d3FD3C6EF372FE950, fd126;
sub.f64 fd541, fd1678, fd540;
sub.f64 fd542, fd365, fd380;
sub.f64 fd544, fd370, fd375;
mul.f64 fd1676, fd542, 0d3FEE6F0E134454FF;
mul.f64 fd1677, fd544, 0dBFE2CF2304755A5E;
sub.f64 fd546, fd1677, fd1676;
sub.f64 fd547, fd541, fd546;
add.f64 fd548, fd546, fd541;
mul.f64 fd549, fd531, 0d3FE9E3779B97F4A8;
sub.f64 fd550, fd126, fd549;
fma.rn.f64 fd551, fd533, 0d3FD3C6EF372FE950, fd550;
mul.f64 fd552, fd542, 0d3FE2CF2304755A5E;
mul.f64 fd553, fd544, 0d3FEE6F0E134454FF;
sub.f64 fd554, fd553, fd552;
sub.f64 fd555, fd551, fd554;
add.f64 fd556, fd554, fd551;
fma.rn.f64 fd1674, fd535, 0d3FD3C6EF372FE950, fd144;
mul.f64 fd1675, fd537, 0d3FE9E3779B97F4A8;
sub.f64 fd559, fd1674, fd1675;
sub.f64 fd560, fd363, fd378;
sub.f64 fd562, fd368, fd373;
mul.f64 fd1672, fd560, 0d3FEE6F0E134454FF;
mul.f64 fd1673, fd562, 0dBFE2CF2304755A5E;
sub.f64 fd564, fd1673, fd1672;
add.f64 fd565, fd564, fd559;
sub.f64 fd566, fd559, fd564;
mul.f64 fd567, fd535, 0d3FE9E3779B97F4A8;
sub.f64 fd568, fd144, fd567;
fma.rn.f64 fd569, fd537, 0d3FD3C6EF372FE950, fd568;
mul.f64 fd570, fd560, 0d3FE2CF2304755A5E;
mul.f64 fd571, fd562, 0d3FEE6F0E134454FF;
sub.f64 fd572, fd571, fd570;
add.f64 fd573, fd572, fd569;
sub.f64 fd574, fd569, fd572;
add.f64 fd575, fd383, fd398;
add.f64 fd577, fd388, fd393;
add.f64 fd1671, fd118, fd575;
add.f64 fd578, fd577, fd1671;
add.f64 fd579, fd385, fd400;
add.f64 fd581, fd390, fd395;
add.f64 fd1670, fd136, fd579;
add.f64 fd582, fd581, fd1670;
fma.rn.f64 fd1668, fd575, 0d3FD3C6EF372FE950, fd118;
mul.f64 fd1669, fd577, 0d3FE9E3779B97F4A8;
sub.f64 fd585, fd1668, fd1669;
sub.f64 fd586, fd385, fd400;
sub.f64 fd588, fd390, fd395;
mul.f64 fd1666, fd586, 0d3FEE6F0E134454FF;
mul.f64 fd1667, fd588, 0dBFE2CF2304755A5E;
sub.f64 fd590, fd1667, fd1666;
sub.f64 fd591, fd585, fd590;
add.f64 fd592, fd590, fd585;
mul.f64 fd593, fd575, 0d3FE9E3779B97F4A8;
sub.f64 fd594, fd118, fd593;
fma.rn.f64 fd595, fd577, 0d3FD3C6EF372FE950, fd594;
mul.f64 fd596, fd586, 0d3FE2CF2304755A5E;
mul.f64 fd597, fd588, 0d3FEE6F0E134454FF;
sub.f64 fd598, fd597, fd596;
sub.f64 fd599, fd595, fd598;
add.f64 fd600, fd598, fd595;
mul.f64 fd602, fd581, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1665, fd579, 0d3FD3C6EF372FE950, fd136;
sub.f64 fd603, fd1665, fd602;
sub.f64 fd604, fd383, fd398;
sub.f64 fd606, fd388, fd393;
mul.f64 fd1663, fd604, 0d3FEE6F0E134454FF;
mul.f64 fd1664, fd606, 0dBFE2CF2304755A5E;
sub.f64 fd608, fd1664, fd1663;
add.f64 fd609, fd608, fd603;
sub.f64 fd610, fd603, fd608;
mul.f64 fd611, fd579, 0d3FE9E3779B97F4A8;
sub.f64 fd612, fd136, fd611;
fma.rn.f64 fd613, fd581, 0d3FD3C6EF372FE950, fd612;
mul.f64 fd614, fd604, 0d3FE2CF2304755A5E;
mul.f64 fd615, fd606, 0d3FEE6F0E134454FF;
sub.f64 fd616, fd615, fd614;
add.f64 fd617, fd616, fd613;
sub.f64 fd618, fd613, fd616;
mov.u32 r11, %tid.x;
mul.wide.u32 rd2, r11, 1374389535;
shr.u64 rd3, rd2, 35;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 25;
sub.s32 r7, r11, r6;
mad.lo.s32 r8, r5, 10000, r3;
mov.u64 rd5, %51;
mul.wide.u32 rd7, r7, 16;
add.s64 rd6, rd5, rd7;
ld.global.v2.f64 {fd619, fd620}, [rd6];
mul.f64 fd624, fd620, fd450;
mul.f64 fd625, fd619, fd450;
mul.f64 fd627, fd620, fd620;
mul.f64 fd1662, fd619, fd619;
sub.f64 fd628, fd1662, fd627;
mul.f64 fd629, fd620, fd619;
fma.rn.f64 fd630, fd620, fd619, fd629;
mul.f64 fd632, fd630, fd494;
mul.f64 fd633, fd628, fd494;
mul.f64 fd1660, fd619, fd628;
mul.f64 fd1661, fd620, fd630;
sub.f64 fd636, fd1660, fd1661;
mul.f64 fd1659, fd628, fd490;
mul.f64 fd637, fd619, fd630;
fma.rn.f64 fd638, fd620, fd628, fd637;
mul.f64 fd640, fd638, fd538;
mul.f64 fd641, fd636, fd538;
mul.f64 fd643, fd620, fd638;
mul.f64 fd1658, fd619, fd636;
sub.f64 fd644, fd1658, fd643;
mul.f64 fd1657, fd636, fd534;
mul.f64 fd645, fd619, fd638;
fma.rn.f64 fd646, fd620, fd636, fd645;
mul.f64 fd648, fd646, fd582;
mul.f64 fd649, fd644, fd582;
mul.f64 fd1655, fd619, fd644;
mul.f64 fd1656, fd620, fd646;
sub.f64 fd652, fd1655, fd1656;
mul.f64 fd1654, fd644, fd578;
mul.f64 fd653, fd619, fd646;
fma.rn.f64 fd654, fd620, fd644, fd653;
mul.f64 fd656, fd654, fd433;
mul.f64 fd657, fd652, fd433;
mul.f64 fd659, fd620, fd654;
mul.f64 fd1653, fd619, fd652;
sub.f64 fd660, fd1653, fd659;
mul.f64 fd1652, fd652, fd415;
mul.f64 fd661, fd619, fd654;
fma.rn.f64 fd662, fd620, fd652, fd661;
mul.f64 fd664, fd662, fd477;
mul.f64 fd665, fd660, fd477;
mul.f64 fd667, fd620, fd662;
mul.f64 fd1651, fd619, fd660;
sub.f64 fd668, fd1651, fd667;
mul.f64 fd1650, fd660, fd459;
mul.f64 fd669, fd619, fd662;
fma.rn.f64 fd670, fd620, fd660, fd669;
mul.f64 fd672, fd670, fd521;
mul.f64 fd673, fd668, fd521;
mul.f64 fd1648, fd619, fd668;
mul.f64 fd1649, fd620, fd670;
sub.f64 fd676, fd1648, fd1649;
mul.f64 fd1647, fd668, fd503;
mul.f64 fd677, fd619, fd670;
fma.rn.f64 fd678, fd620, fd668, fd677;
mul.f64 fd680, fd678, fd565;
mul.f64 fd681, fd676, fd565;
mul.f64 fd683, fd620, fd678;
mul.f64 fd1646, fd619, fd676;
sub.f64 fd684, fd1646, fd683;
mul.f64 fd1645, fd676, fd547;
mul.f64 fd685, fd619, fd678;
fma.rn.f64 fd686, fd620, fd676, fd685;
mul.f64 fd688, fd686, fd609;
mul.f64 fd689, fd684, fd609;
mul.f64 fd691, fd620, fd686;
mul.f64 fd1644, fd619, fd684;
sub.f64 fd692, fd1644, fd691;
mul.f64 fd1643, fd684, fd591;
mul.f64 fd693, fd619, fd686;
fma.rn.f64 fd694, fd620, fd684, fd693;
mul.f64 fd696, fd694, fd441;
mul.f64 fd697, fd692, fd441;
mul.f64 fd1641, fd619, fd692;
mul.f64 fd1642, fd620, fd694;
sub.f64 fd700, fd1641, fd1642;
mul.f64 fd1640, fd692, fd423;
mul.f64 fd701, fd619, fd694;
fma.rn.f64 fd702, fd620, fd692, fd701;
mul.f64 fd704, fd702, fd485;
mul.f64 fd705, fd700, fd485;
mul.f64 fd707, fd620, fd702;
mul.f64 fd1639, fd619, fd700;
sub.f64 fd708, fd1639, fd707;
mul.f64 fd1638, fd700, fd467;
mul.f64 fd709, fd619, fd702;
fma.rn.f64 fd710, fd620, fd700, fd709;
mul.f64 fd711, fd708, fd511;
mul.f64 fd712, fd710, fd529;
mul.f64 fd713, fd708, fd529;
ld.global.v2.f64 {fd714, fd715}, [rd6+400];
mul.f64 fd719, fd715, fd573;
mul.f64 fd720, fd714, fd573;
mul.f64 fd1636, fd619, fd714;
mul.f64 fd1637, fd620, fd715;
sub.f64 fd723, fd1636, fd1637;
mul.f64 fd1635, fd714, fd555;
mul.f64 fd724, fd619, fd715;
fma.rn.f64 fd725, fd620, fd714, fd724;
mul.f64 fd727, fd725, fd617;
mul.f64 fd728, fd723, fd617;
mul.f64 fd730, fd620, fd725;
mul.f64 fd1634, fd619, fd723;
sub.f64 fd731, fd1634, fd730;
mul.f64 fd1633, fd723, fd599;
mul.f64 fd732, fd619, fd725;
fma.rn.f64 fd733, fd620, fd723, fd732;
mul.f64 fd735, fd733, fd442;
mul.f64 fd736, fd731, fd442;
mul.f64 fd738, fd620, fd733;
mul.f64 fd1632, fd619, fd731;
sub.f64 fd739, fd1632, fd738;
mul.f64 fd1631, fd731, fd424;
mul.f64 fd740, fd619, fd733;
fma.rn.f64 fd741, fd620, fd731, fd740;
mul.f64 fd743, fd741, fd486;
mul.f64 fd744, fd739, fd486;
mul.f64 fd1629, fd619, fd739;
mul.f64 fd1630, fd620, fd741;
sub.f64 fd747, fd1629, fd1630;
mul.f64 fd1628, fd739, fd468;
mul.f64 fd748, fd619, fd741;
fma.rn.f64 fd749, fd620, fd739, fd748;
mul.f64 fd751, fd749, fd530;
mul.f64 fd752, fd747, fd530;
mul.f64 fd754, fd620, fd749;
mul.f64 fd1627, fd619, fd747;
sub.f64 fd755, fd1627, fd754;
mul.f64 fd1626, fd747, fd512;
mul.f64 fd756, fd619, fd749;
fma.rn.f64 fd757, fd620, fd747, fd756;
mul.f64 fd759, fd757, fd574;
mul.f64 fd760, fd755, fd574;
mul.f64 fd762, fd620, fd757;
mul.f64 fd1625, fd619, fd755;
sub.f64 fd763, fd1625, fd762;
mul.f64 fd1624, fd755, fd556;
mul.f64 fd764, fd619, fd757;
fma.rn.f64 fd765, fd620, fd755, fd764;
mul.f64 fd767, fd765, fd618;
mul.f64 fd768, fd763, fd618;
mul.f64 fd1622, fd619, fd763;
mul.f64 fd1623, fd620, fd765;
sub.f64 fd771, fd1622, fd1623;
mul.f64 fd1621, fd763, fd600;
mul.f64 fd772, fd619, fd765;
fma.rn.f64 fd773, fd620, fd763, fd772;
mul.f64 fd775, fd773, fd434;
mul.f64 fd776, fd771, fd434;
mul.f64 fd778, fd620, fd773;
mul.f64 fd1620, fd619, fd771;
sub.f64 fd779, fd1620, fd778;
mul.f64 fd1619, fd771, fd416;
mul.f64 fd780, fd619, fd773;
fma.rn.f64 fd781, fd620, fd771, fd780;
mul.f64 fd783, fd781, fd478;
mul.f64 fd784, fd779, fd478;
mul.f64 fd1617, fd619, fd779;
mul.f64 fd1618, fd620, fd781;
sub.f64 fd787, fd1617, fd1618;
mul.f64 fd1616, fd779, fd460;
mul.f64 fd788, fd619, fd781;
fma.rn.f64 fd789, fd620, fd779, fd788;
mul.f64 fd791, fd789, fd522;
mul.f64 fd792, fd787, fd522;
mul.f64 fd794, fd620, fd789;
mul.f64 fd1615, fd619, fd787;
sub.f64 fd795, fd1615, fd794;
mul.f64 fd1614, fd787, fd504;
mul.f64 fd796, fd619, fd789;
fma.rn.f64 fd797, fd620, fd787, fd796;
mul.f64 fd799, fd797, fd566;
mul.f64 fd800, fd795, fd566;
mul.f64 fd802, fd620, fd797;
mul.f64 fd1613, fd619, fd795;
sub.f64 fd803, fd1613, fd802;
mul.f64 fd1612, fd619, fd446;
mul.f64 fd804, fd619, fd797;
mul.f64 fd1611, fd795, fd548;
fma.rn.f64 fd805, fd620, fd795, fd804;
mul.f64 fd806, fd803, fd592;
mul.f64 fd807, fd805, fd610;
mul.f64 fd808, fd803, fd610;
barrier.sync 0;
mad.lo.s32 r9, r7, 400, r8;
add.f64 fd809, fd1705, fd1698;
add.f64 fd810, fd403, fd1703;
st.shared.v2.f64 [r9], {fd810, fd809};
fma.rn.f64 fd811, fd620, fd446, fd625;
sub.f64 fd812, fd1612, fd624;
st.shared.v2.f64 [r9+16], {fd812, fd811};
fma.rn.f64 fd813, fd630, fd490, fd633;
sub.f64 fd814, fd1659, fd632;
st.shared.v2.f64 [r9+32], {fd814, fd813};
fma.rn.f64 fd815, fd638, fd534, fd641;
sub.f64 fd816, fd1657, fd640;
st.shared.v2.f64 [r9+48], {fd816, fd815};
fma.rn.f64 fd817, fd646, fd578, fd649;
sub.f64 fd818, fd1654, fd648;
st.shared.v2.f64 [r9+64], {fd818, fd817};
sub.f64 fd819, fd1652, fd656;
fma.rn.f64 fd820, fd654, fd415, fd657;
st.shared.v2.f64 [r9+80], {fd819, fd820};
fma.rn.f64 fd821, fd662, fd459, fd665;
sub.f64 fd822, fd1650, fd664;
st.shared.v2.f64 [r9+96], {fd822, fd821};
sub.f64 fd823, fd1647, fd672;
fma.rn.f64 fd824, fd670, fd503, fd673;
st.shared.v2.f64 [r9+112], {fd823, fd824};
fma.rn.f64 fd825, fd678, fd547, fd681;
sub.f64 fd826, fd1645, fd680;
st.shared.v2.f64 [r9+128], {fd826, fd825};
fma.rn.f64 fd827, fd686, fd591, fd689;
sub.f64 fd828, fd1643, fd688;
st.shared.v2.f64 [r9+144], {fd828, fd827};
fma.rn.f64 fd829, fd694, fd423, fd697;
sub.f64 fd830, fd1640, fd696;
st.shared.v2.f64 [r9+160], {fd830, fd829};
fma.rn.f64 fd831, fd702, fd467, fd705;
sub.f64 fd832, fd1638, fd704;
st.shared.v2.f64 [r9+176], {fd832, fd831};
fma.rn.f64 fd833, fd710, fd511, fd713;
sub.f64 fd834, fd711, fd712;
st.shared.v2.f64 [r9+192], {fd834, fd833};
fma.rn.f64 fd835, fd715, fd555, fd720;
sub.f64 fd836, fd1635, fd719;
st.shared.v2.f64 [r9+208], {fd836, fd835};
fma.rn.f64 fd837, fd725, fd599, fd728;
sub.f64 fd838, fd1633, fd727;
st.shared.v2.f64 [r9+224], {fd838, fd837};
fma.rn.f64 fd839, fd733, fd424, fd736;
sub.f64 fd840, fd1631, fd735;
st.shared.v2.f64 [r9+240], {fd840, fd839};
fma.rn.f64 fd841, fd741, fd468, fd744;
sub.f64 fd842, fd1628, fd743;
st.shared.v2.f64 [r9+256], {fd842, fd841};
fma.rn.f64 fd843, fd749, fd512, fd752;
sub.f64 fd844, fd1626, fd751;
st.shared.v2.f64 [r9+272], {fd844, fd843};
fma.rn.f64 fd845, fd757, fd556, fd760;
sub.f64 fd846, fd1624, fd759;
st.shared.v2.f64 [r9+288], {fd846, fd845};
sub.f64 fd847, fd1621, fd767;
fma.rn.f64 fd848, fd765, fd600, fd768;
st.shared.v2.f64 [r9+304], {fd847, fd848};
fma.rn.f64 fd849, fd773, fd416, fd776;
sub.f64 fd850, fd1619, fd775;
st.shared.v2.f64 [r9+320], {fd850, fd849};
fma.rn.f64 fd851, fd781, fd460, fd784;
sub.f64 fd852, fd1616, fd783;
st.shared.v2.f64 [r9+336], {fd852, fd851};
fma.rn.f64 fd853, fd789, fd504, fd792;
sub.f64 fd854, fd1614, fd791;
st.shared.v2.f64 [r9+352], {fd854, fd853};
fma.rn.f64 fd855, fd797, fd548, fd800;
sub.f64 fd856, fd1611, fd799;
st.shared.v2.f64 [r9+368], {fd856, fd855};
fma.rn.f64 fd857, fd805, fd592, fd808;
sub.f64 fd858, fd806, fd807;
st.shared.v2.f64 [r9+384], {fd858, fd857};
barrier.sync 0;
mad.lo.s32 r10, r7, -384, r9;
ld.shared.v2.f64 {fd859, fd860}, [r10];
ld.shared.v2.f64 {fd863, fd864}, [r10+400];
ld.shared.v2.f64 {fd867, fd868}, [r10+800];
ld.shared.v2.f64 {fd871, fd872}, [r10+1200];
ld.shared.v2.f64 {fd875, fd876}, [r10+1600];
ld.shared.v2.f64 {fd879, fd880}, [r10+2000];
ld.shared.v2.f64 {fd883, fd884}, [r10+2400];
ld.shared.v2.f64 {fd887, fd888}, [r10+2800];
ld.shared.v2.f64 {fd891, fd892}, [r10+3200];
ld.shared.v2.f64 {fd895, fd896}, [r10+3600];
ld.shared.v2.f64 {fd899, fd900}, [r10+4000];
ld.shared.v2.f64 {fd903, fd904}, [r10+4400];
ld.shared.v2.f64 {fd907, fd908}, [r10+4800];
ld.shared.v2.f64 {fd911, fd912}, [r10+5200];
ld.shared.v2.f64 {fd915, fd916}, [r10+5600];
ld.shared.v2.f64 {fd919, fd920}, [r10+6000];
ld.shared.v2.f64 {fd923, fd924}, [r10+6400];
ld.shared.v2.f64 {fd927, fd928}, [r10+6800];
ld.shared.v2.f64 {fd931, fd932}, [r10+7200];
ld.shared.v2.f64 {fd935, fd936}, [r10+7600];
ld.shared.v2.f64 {fd939, fd940}, [r10+8000];
ld.shared.v2.f64 {fd943, fd944}, [r10+8400];
ld.shared.v2.f64 {fd947, fd948}, [r10+8800];
ld.shared.v2.f64 {fd951, fd952}, [r10+9200];
ld.shared.v2.f64 {fd955, fd956}, [r10+9600];
add.f64 fd959, fd879, fd939;
add.f64 fd961, fd899, fd919;
add.f64 fd1610, fd859, fd959;
add.f64 fd962, fd961, fd1610;
add.f64 fd963, fd880, fd940;
add.f64 fd965, fd900, fd920;
add.f64 fd1609, fd860, fd963;
add.f64 fd966, fd965, fd1609;
mul.f64 fd968, fd961, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1608, fd959, 0d3FD3C6EF372FE950, fd859;
sub.f64 fd969, fd1608, fd968;
sub.f64 fd970, fd880, fd940;
sub.f64 fd972, fd900, fd920;
mul.f64 fd1606, fd970, 0d3FEE6F0E134454FF;
mul.f64 fd1607, fd972, 0dBFE2CF2304755A5E;
sub.f64 fd974, fd1607, fd1606;
sub.f64 fd975, fd969, fd974;
add.f64 fd976, fd974, fd969;
mul.f64 fd977, fd959, 0d3FE9E3779B97F4A8;
sub.f64 fd978, fd859, fd977;
fma.rn.f64 fd979, fd961, 0d3FD3C6EF372FE950, fd978;
mul.f64 fd980, fd970, 0d3FE2CF2304755A5E;
mul.f64 fd981, fd972, 0d3FEE6F0E134454FF;
sub.f64 fd982, fd981, fd980;
sub.f64 fd983, fd979, fd982;
add.f64 fd984, fd982, fd979;
fma.rn.f64 fd1604, fd963, 0d3FD3C6EF372FE950, fd860;
mul.f64 fd1605, fd965, 0d3FE9E3779B97F4A8;
sub.f64 fd987, fd1604, fd1605;
sub.f64 fd988, fd879, fd939;
sub.f64 fd990, fd899, fd919;
mul.f64 fd1602, fd988, 0d3FEE6F0E134454FF;
mul.f64 fd1603, fd990, 0dBFE2CF2304755A5E;
sub.f64 fd992, fd1603, fd1602;
add.f64 fd993, fd992, fd987;
sub.f64 fd994, fd987, fd992;
mul.f64 fd995, fd963, 0d3FE9E3779B97F4A8;
sub.f64 fd996, fd860, fd995;
fma.rn.f64 fd997, fd965, 0d3FD3C6EF372FE950, fd996;
mul.f64 fd998, fd988, 0d3FE2CF2304755A5E;
mul.f64 fd999, fd990, 0d3FEE6F0E134454FF;
sub.f64 fd1000, fd999, fd998;
add.f64 fd1001, fd1000, fd997;
sub.f64 fd1002, fd997, fd1000;
add.f64 fd1003, fd883, fd943;
add.f64 fd1005, fd903, fd923;
add.f64 fd1601, fd863, fd1003;
add.f64 fd1006, fd1005, fd1601;
add.f64 fd1007, fd884, fd944;
add.f64 fd1009, fd904, fd924;
add.f64 fd1600, fd864, fd1007;
add.f64 fd1010, fd1009, fd1600;
fma.rn.f64 fd1598, fd1003, 0d3FD3C6EF372FE950, fd863;
mul.f64 fd1599, fd1005, 0d3FE9E3779B97F4A8;
sub.f64 fd1013, fd1598, fd1599;
sub.f64 fd1014, fd884, fd944;
sub.f64 fd1016, fd904, fd924;
mul.f64 fd1596, fd1014, 0d3FEE6F0E134454FF;
mul.f64 fd1597, fd1016, 0dBFE2CF2304755A5E;
sub.f64 fd1018, fd1597, fd1596;
sub.f64 fd1019, fd1013, fd1018;
add.f64 fd1020, fd1018, fd1013;
mul.f64 fd1021, fd1003, 0d3FE9E3779B97F4A8;
sub.f64 fd1022, fd863, fd1021;
fma.rn.f64 fd1023, fd1005, 0d3FD3C6EF372FE950, fd1022;
mul.f64 fd1024, fd1014, 0d3FE2CF2304755A5E;
mul.f64 fd1025, fd1016, 0d3FEE6F0E134454FF;
sub.f64 fd1026, fd1025, fd1024;
sub.f64 fd1027, fd1023, fd1026;
add.f64 fd1028, fd1026, fd1023;
mul.f64 fd1030, fd1009, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1595, fd1007, 0d3FD3C6EF372FE950, fd864;
sub.f64 fd1031, fd1595, fd1030;
sub.f64 fd1032, fd883, fd943;
sub.f64 fd1034, fd903, fd923;
mul.f64 fd1035, fd1034, 0dBFE2CF2304755A5E;
mul.f64 fd1594, fd1032, 0d3FEE6F0E134454FF;
sub.f64 fd1036, fd1035, fd1594;
add.f64 fd1037, fd1036, fd1031;
sub.f64 fd1038, fd1031, fd1036;
mul.f64 fd1039, fd1007, 0d3FE9E3779B97F4A8;
sub.f64 fd1040, fd864, fd1039;
fma.rn.f64 fd1041, fd1009, 0d3FD3C6EF372FE950, fd1040;
mul.f64 fd1042, fd1032, 0d3FE2CF2304755A5E;
mul.f64 fd1043, fd1034, 0d3FEE6F0E134454FF;
sub.f64 fd1044, fd1043, fd1042;
add.f64 fd1045, fd1044, fd1041;
sub.f64 fd1046, fd1041, fd1044;
add.f64 fd1047, fd887, fd947;
add.f64 fd1049, fd907, fd927;
add.f64 fd1593, fd867, fd1047;
add.f64 fd1050, fd1049, fd1593;
add.f64 fd1051, fd888, fd948;
add.f64 fd1053, fd908, fd928;
add.f64 fd1592, fd868, fd1051;
add.f64 fd1054, fd1053, fd1592;
mul.f64 fd1056, fd1049, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1591, fd1047, 0d3FD3C6EF372FE950, fd867;
sub.f64 fd1057, fd1591, fd1056;
sub.f64 fd1058, fd888, fd948;
sub.f64 fd1060, fd908, fd928;
mul.f64 fd1061, fd1060, 0dBFE2CF2304755A5E;
mul.f64 fd1590, fd1058, 0d3FEE6F0E134454FF;
sub.f64 fd1062, fd1061, fd1590;
sub.f64 fd1063, fd1057, fd1062;
add.f64 fd1064, fd1062, fd1057;
mul.f64 fd1065, fd1047, 0d3FE9E3779B97F4A8;
sub.f64 fd1066, fd867, fd1065;
fma.rn.f64 fd1067, fd1049, 0d3FD3C6EF372FE950, fd1066;
mul.f64 fd1068, fd1058, 0d3FE2CF2304755A5E;
mul.f64 fd1069, fd1060, 0d3FEE6F0E134454FF;
sub.f64 fd1070, fd1069, fd1068;
sub.f64 fd1071, fd1067, fd1070;
add.f64 fd1072, fd1070, fd1067;
fma.rn.f64 fd1588, fd1051, 0d3FD3C6EF372FE950, fd868;
mul.f64 fd1589, fd1053, 0d3FE9E3779B97F4A8;
sub.f64 fd1075, fd1588, fd1589;
sub.f64 fd1076, fd887, fd947;
sub.f64 fd1078, fd907, fd927;
mul.f64 fd1586, fd1076, 0d3FEE6F0E134454FF;
mul.f64 fd1587, fd1078, 0dBFE2CF2304755A5E;
sub.f64 fd1080, fd1587, fd1586;
add.f64 fd1081, fd1080, fd1075;
sub.f64 fd1082, fd1075, fd1080;
mul.f64 fd1083, fd1051, 0d3FE9E3779B97F4A8;
sub.f64 fd1084, fd868, fd1083;
fma.rn.f64 fd1085, fd1053, 0d3FD3C6EF372FE950, fd1084;
mul.f64 fd1086, fd1076, 0d3FE2CF2304755A5E;
mul.f64 fd1087, fd1078, 0d3FEE6F0E134454FF;
sub.f64 fd1088, fd1087, fd1086;
add.f64 fd1089, fd1088, fd1085;
sub.f64 fd1090, fd1085, fd1088;
add.f64 fd1091, fd891, fd951;
add.f64 fd1093, fd911, fd931;
add.f64 fd1585, fd871, fd1091;
add.f64 fd1094, fd1093, fd1585;
add.f64 fd1095, fd892, fd952;
add.f64 fd1097, fd912, fd932;
add.f64 fd1584, fd872, fd1095;
add.f64 fd1098, fd1097, fd1584;
fma.rn.f64 fd1582, fd1091, 0d3FD3C6EF372FE950, fd871;
mul.f64 fd1583, fd1093, 0d3FE9E3779B97F4A8;
sub.f64 fd1101, fd1582, fd1583;
sub.f64 fd1102, fd892, fd952;
sub.f64 fd1104, fd912, fd932;
mul.f64 fd1580, fd1102, 0d3FEE6F0E134454FF;
mul.f64 fd1581, fd1104, 0dBFE2CF2304755A5E;
sub.f64 fd1106, fd1581, fd1580;
sub.f64 fd1107, fd1101, fd1106;
add.f64 fd1108, fd1106, fd1101;
mul.f64 fd1109, fd1091, 0d3FE9E3779B97F4A8;
sub.f64 fd1110, fd871, fd1109;
fma.rn.f64 fd1111, fd1093, 0d3FD3C6EF372FE950, fd1110;
mul.f64 fd1112, fd1102, 0d3FE2CF2304755A5E;
mul.f64 fd1113, fd1104, 0d3FEE6F0E134454FF;
sub.f64 fd1114, fd1113, fd1112;
sub.f64 fd1115, fd1111, fd1114;
add.f64 fd1116, fd1114, fd1111;
mul.f64 fd1118, fd1097, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1579, fd1095, 0d3FD3C6EF372FE950, fd872;
sub.f64 fd1119, fd1579, fd1118;
sub.f64 fd1120, fd891, fd951;
sub.f64 fd1122, fd911, fd931;
mul.f64 fd1577, fd1120, 0d3FEE6F0E134454FF;
mul.f64 fd1578, fd1122, 0dBFE2CF2304755A5E;
sub.f64 fd1124, fd1578, fd1577;
add.f64 fd1125, fd1124, fd1119;
sub.f64 fd1126, fd1119, fd1124;
mul.f64 fd1127, fd1095, 0d3FE9E3779B97F4A8;
sub.f64 fd1128, fd872, fd1127;
fma.rn.f64 fd1129, fd1097, 0d3FD3C6EF372FE950, fd1128;
mul.f64 fd1130, fd1120, 0d3FE2CF2304755A5E;
mul.f64 fd1131, fd1122, 0d3FEE6F0E134454FF;
sub.f64 fd1132, fd1131, fd1130;
add.f64 fd1133, fd1132, fd1129;
sub.f64 fd1134, fd1129, fd1132;
add.f64 fd1135, fd895, fd955;
add.f64 fd1137, fd915, fd935;
add.f64 fd1576, fd875, fd1135;
add.f64 fd1138, fd1137, fd1576;
add.f64 fd1139, fd896, fd956;
add.f64 fd1141, fd916, fd936;
add.f64 fd1575, fd876, fd1139;
add.f64 fd1142, fd1141, fd1575;
mul.f64 fd1144, fd1137, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1574, fd1135, 0d3FD3C6EF372FE950, fd875;
sub.f64 fd1145, fd1574, fd1144;
sub.f64 fd1146, fd896, fd956;
sub.f64 fd1148, fd916, fd936;
mul.f64 fd1572, fd1146, 0d3FEE6F0E134454FF;
mul.f64 fd1573, fd1148, 0dBFE2CF2304755A5E;
sub.f64 fd1150, fd1573, fd1572;
sub.f64 fd1151, fd1145, fd1150;
add.f64 fd1152, fd1150, fd1145;
mul.f64 fd1153, fd1135, 0d3FE9E3779B97F4A8;
sub.f64 fd1154, fd875, fd1153;
fma.rn.f64 fd1155, fd1137, 0d3FD3C6EF372FE950, fd1154;
mul.f64 fd1156, fd1146, 0d3FE2CF2304755A5E;
mul.f64 fd1157, fd1148, 0d3FEE6F0E134454FF;
sub.f64 fd1158, fd1157, fd1156;
sub.f64 fd1159, fd1155, fd1158;
add.f64 fd1160, fd1158, fd1155;
mul.f64 fd1162, fd1141, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1571, fd1139, 0d3FD3C6EF372FE950, fd876;
sub.f64 fd1163, fd1571, fd1162;
sub.f64 fd1164, fd895, fd955;
sub.f64 fd1166, fd915, fd935;
mul.f64 fd1569, fd1164, 0d3FEE6F0E134454FF;
mul.f64 fd1570, fd1166, 0dBFE2CF2304755A5E;
sub.f64 fd1168, fd1570, fd1569;
add.f64 fd1169, fd1168, fd1163;
sub.f64 fd1170, fd1163, fd1168;
mul.f64 fd1171, fd1139, 0d3FE9E3779B97F4A8;
sub.f64 fd1172, fd876, fd1171;
fma.rn.f64 fd1173, fd1141, 0d3FD3C6EF372FE950, fd1172;
mul.f64 fd1174, fd1164, 0d3FE2CF2304755A5E;
mul.f64 fd1175, fd1166, 0d3FEE6F0E134454FF;
sub.f64 fd1176, fd1175, fd1174;
add.f64 fd1177, fd1176, fd1173;
sub.f64 fd1178, fd1173, fd1176;
mul.f64 fd1567, fd1019, 0d3FEEFEA21D101EE0;
mul.f64 fd1568, fd1037, 0dBFCFD511FA1C0796;
sub.f64 fd1181, fd1567, fd1568;
mul.f64 fd1182, fd1037, 0d3FEEFEA21D101EE0;
fma.rn.f64 fd1183, fd1019, 0dBFCFD511FA1C0796, fd1182;
mul.f64 fd1565, fd1063, 0d3FEC0AB44E81C059;
mul.f64 fd1566, fd1081, 0dBFDED50D5CBFA951;
sub.f64 fd1186, fd1565, fd1566;
mul.f64 fd1187, fd1081, 0d3FEC0AB44E81C059;
fma.rn.f64 fd1188, fd1063, 0dBFDED50D5CBFA951, fd1187;
mul.f64 fd1563, fd1107, 0d3FE753B603D2B816;
mul.f64 fd1564, fd1125, 0dBFE5E7CF55112014;
sub.f64 fd1191, fd1563, fd1564;
mul.f64 fd1192, fd1125, 0d3FE753B603D2B816;
fma.rn.f64 fd1193, fd1107, 0dBFE5E7CF55112014, fd1192;
mul.f64 fd1195, fd1169, 0dBFEB04BBFF642E86;
mul.f64 fd1562, fd1151, 0d3FE1257E3C182B51;
sub.f64 fd1196, fd1562, fd1195;
mul.f64 fd1197, fd1169, 0d3FE1257E3C182B51;
fma.rn.f64 fd1198, fd1151, 0dBFEB04BBFF642E86, fd1197;
mul.f64 fd1200, fd1045, 0dBFDED50D5CBFA951;
mul.f64 fd1561, fd1027, 0d3FEC0AB44E81C059;
sub.f64 fd1201, fd1561, fd1200;
mul.f64 fd1202, fd1045, 0d3FEC0AB44E81C059;
fma.rn.f64 fd1203, fd1027, 0dBFDED50D5CBFA951, fd1202;
mul.f64 fd1205, fd1089, 0dBFEB04BBFF642E86;
mul.f64 fd1560, fd1071, 0d3FE1257E3C182B51;
sub.f64 fd1206, fd1560, fd1205;
mul.f64 fd1207, fd1089, 0d3FE1257E3C182B51;
fma.rn.f64 fd1208, fd1071, 0dBFEB04BBFF642E86, fd1207;
mul.f64 fd1210, fd1133, 0dBFEFEFD5BFE443FE;
mul.f64 fd1559, fd1115, 0d3FB0130A1BE09379;
sub.f64 fd1211, fd1559, fd1210;
mul.f64 fd1212, fd1133, 0d3FB0130A1BE09379;
fma.rn.f64 fd1213, fd1115, 0dBFEFEFD5BFE443FE, fd1212;
mul.f64 fd1215, fd1177, 0dBFECF457DCDC158C;
mul.f64 fd1558, fd1159, 0dBFDB3FF7C925819C;
sub.f64 fd1216, fd1558, fd1215;
mul.f64 fd1217, fd1177, 0dBFDB3FF7C925819C;
fma.rn.f64 fd1218, fd1159, 0dBFECF457DCDC158C, fd1217;
mul.f64 fd1556, fd1028, 0d3FE753B603D2B816;
mul.f64 fd1557, fd1046, 0dBFE5E7CF55112014;
sub.f64 fd1221, fd1556, fd1557;
mul.f64 fd1222, fd1046, 0d3FE753B603D2B816;
fma.rn.f64 fd1223, fd1028, 0dBFE5E7CF55112014, fd1222;
mul.f64 fd1554, fd1072, 0d3FB0130A1BE09379;
mul.f64 fd1555, fd1090, 0dBFEFEFD5BFE443FE;
sub.f64 fd1226, fd1554, fd1555;
mul.f64 fd1227, fd1090, 0d3FB0130A1BE09379;
fma.rn.f64 fd1228, fd1072, 0dBFEFEFD5BFE443FE, fd1227;
mul.f64 fd1552, fd1116, 0dBFE465C6FEB501BC;
mul.f64 fd1553, fd1134, 0dBFE8A80B635B6BEA;
sub.f64 fd1231, fd1552, fd1553;
mul.f64 fd1232, fd1134, 0dBFE465C6FEB501BC;
fma.rn.f64 fd1233, fd1116, 0dBFE8A80B635B6BEA, fd1232;
mul.f64 fd1550, fd1160, 0dBFEFBF675480D903;
mul.f64 fd1551, fd1178, 0dBFC00AEB5DA15BE0;
sub.f64 fd1236, fd1550, fd1551;
mul.f64 fd1237, fd1178, 0dBFEFBF675480D903;
fma.rn.f64 fd1238, fd1160, 0dBFC00AEB5DA15BE0, fd1237;
mul.f64 fd1240, fd1038, 0dBFEB04BBFF642E86;
mul.f64 fd1549, fd1020, 0d3FE1257E3C182B51;
sub.f64 fd1241, fd1549, fd1240;
mul.f64 fd1242, fd1038, 0d3FE1257E3C182B51;
fma.rn.f64 fd1243, fd1020, 0dBFEB04BBFF642E86, fd1242;
mul.f64 fd1245, fd1082, 0dBFECF457DCDC158C;
mul.f64 fd1548, fd1064, 0dBFDB3FF7C925819C;
sub.f64 fd1246, fd1548, fd1245;
mul.f64 fd1247, fd1082, 0dBFDB3FF7C925819C;
fma.rn.f64 fd1248, fd1064, 0dBFECF457DCDC158C, fd1247;
mul.f64 fd1250, fd1126, 0dBFC00AEB5DA15BE0;
mul.f64 fd1547, fd1108, 0dBFEFBF675480D903;
sub.f64 fd1251, fd1547, fd1250;
mul.f64 fd1252, fd1126, 0dBFEFBF675480D903;
fma.rn.f64 fd1253, fd1108, 0dBFC00AEB5DA15BE0, fd1252;
mul.f64 fd1255, fd1170, 0d3FE8A80B635B6BEA;
mul.f64 fd1546, fd1152, 0dBFE465C6FEB501BC;
sub.f64 fd1256, fd1546, fd1255;
mul.f64 fd1257, fd1170, 0dBFE465C6FEB501BC;
fma.rn.f64 fd1258, fd1152, 0d3FE8A80B635B6BEA, fd1257;
add.f64 fd1259, fd1006, fd1138;
add.f64 fd1261, fd1050, fd1094;
fma.rn.f64 fd1544, fd1259, 0d3FD3C6EF372FE950, fd962;
mul.f64 fd1545, fd1261, 0d3FE9E3779B97F4A8;
sub.f64 fd1267, fd1544, fd1545;
add.f64 fd1543, fd1010, fd1142;
sub.f64 fd1268, fd1010, fd1142;
add.f64 fd1542, fd1054, fd1098;
sub.f64 fd1270, fd1054, fd1098;
mul.f64 fd1540, fd1268, 0d3FEE6F0E134454FF;
mul.f64 fd1541, fd1270, 0dBFE2CF2304755A5E;
sub.f64 fd1272, fd1541, fd1540;
add.f64 fd1539, fd962, fd1259;
mul.f64 fd1273, fd1259, 0d3FE9E3779B97F4A8;
sub.f64 fd1274, fd962, fd1273;
fma.rn.f64 fd1275, fd1261, 0d3FD3C6EF372FE950, fd1274;
mul.f64 fd1276, fd1268, 0d3FE2CF2304755A5E;
mul.f64 fd1277, fd1270, 0d3FEE6F0E134454FF;
sub.f64 fd1278, fd1277, fd1276;
fma.rn.f64 fd1537, fd1543, 0d3FD3C6EF372FE950, fd966;
mul.f64 fd1538, fd1542, 0d3FE9E3779B97F4A8;
sub.f64 fd1281, fd1537, fd1538;
sub.f64 fd1282, fd1006, fd1138;
sub.f64 fd1284, fd1050, fd1094;
mul.f64 fd1535, fd1282, 0d3FEE6F0E134454FF;
mul.f64 fd1536, fd1284, 0dBFE2CF2304755A5E;
sub.f64 fd1286, fd1536, fd1535;
add.f64 fd1534, fd966, fd1543;
mul.f64 fd1287, fd1543, 0d3FE9E3779B97F4A8;
sub.f64 fd1288, fd966, fd1287;
fma.rn.f64 fd1289, fd1542, 0d3FD3C6EF372FE950, fd1288;
mul.f64 fd1290, fd1282, 0d3FE2CF2304755A5E;
mul.f64 fd1291, fd1284, 0d3FEE6F0E134454FF;
sub.f64 fd1292, fd1291, fd1290;
add.f64 fd1293, fd1181, fd1196;
add.f64 fd1295, fd1186, fd1191;
mul.f64 fd1300, fd1295, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1533, fd1293, 0d3FD3C6EF372FE950, fd975;
sub.f64 fd1301, fd1533, fd1300;
add.f64 fd1532, fd1183, fd1198;
sub.f64 fd1302, fd1183, fd1198;
add.f64 fd1531, fd1188, fd1193;
sub.f64 fd1304, fd1188, fd1193;
mul.f64 fd1305, fd1304, 0dBFE2CF2304755A5E;
mul.f64 fd1530, fd1302, 0d3FEE6F0E134454FF;
sub.f64 fd1306, fd1305, fd1530;
add.f64 fd1529, fd975, fd1293;
mul.f64 fd1307, fd1293, 0d3FE9E3779B97F4A8;
sub.f64 fd1308, fd975, fd1307;
fma.rn.f64 fd1309, fd1295, 0d3FD3C6EF372FE950, fd1308;
mul.f64 fd1310, fd1302, 0d3FE2CF2304755A5E;
mul.f64 fd1311, fd1304, 0d3FEE6F0E134454FF;
sub.f64 fd1312, fd1311, fd1310;
mul.f64 fd1314, fd1531, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1528, fd1532, 0d3FD3C6EF372FE950, fd993;
sub.f64 fd1315, fd1528, fd1314;
sub.f64 fd1316, fd1181, fd1196;
sub.f64 fd1318, fd1186, fd1191;
mul.f64 fd1526, fd1316, 0d3FEE6F0E134454FF;
mul.f64 fd1527, fd1318, 0dBFE2CF2304755A5E;
sub.f64 fd1320, fd1527, fd1526;
add.f64 fd1525, fd993, fd1532;
mul.f64 fd1321, fd1532, 0d3FE9E3779B97F4A8;
sub.f64 fd1322, fd993, fd1321;
fma.rn.f64 fd1323, fd1531, 0d3FD3C6EF372FE950, fd1322;
mul.f64 fd1324, fd1316, 0d3FE2CF2304755A5E;
mul.f64 fd1325, fd1318, 0d3FEE6F0E134454FF;
sub.f64 fd1326, fd1325, fd1324;
add.f64 fd1327, fd1201, fd1216;
add.f64 fd1329, fd1206, fd1211;
fma.rn.f64 fd1523, fd1327, 0d3FD3C6EF372FE950, fd983;
mul.f64 fd1524, fd1329, 0d3FE9E3779B97F4A8;
sub.f64 fd1335, fd1523, fd1524;
add.f64 fd1522, fd1203, fd1218;
sub.f64 fd1336, fd1203, fd1218;
add.f64 fd1521, fd1208, fd1213;
sub.f64 fd1338, fd1208, fd1213;
mul.f64 fd1519, fd1336, 0d3FEE6F0E134454FF;
mul.f64 fd1520, fd1338, 0dBFE2CF2304755A5E;
sub.f64 fd1340, fd1520, fd1519;
add.f64 fd1518, fd983, fd1327;
mul.f64 fd1341, fd1327, 0d3FE9E3779B97F4A8;
sub.f64 fd1342, fd983, fd1341;
fma.rn.f64 fd1343, fd1329, 0d3FD3C6EF372FE950, fd1342;
mul.f64 fd1344, fd1336, 0d3FE2CF2304755A5E;
mul.f64 fd1345, fd1338, 0d3FEE6F0E134454FF;
sub.f64 fd1346, fd1345, fd1344;
fma.rn.f64 fd1516, fd1522, 0d3FD3C6EF372FE950, fd1001;
mul.f64 fd1517, fd1521, 0d3FE9E3779B97F4A8;
sub.f64 fd1349, fd1516, fd1517;
sub.f64 fd1350, fd1201, fd1216;
sub.f64 fd1352, fd1206, fd1211;
mul.f64 fd1514, fd1350, 0d3FEE6F0E134454FF;
mul.f64 fd1515, fd1352, 0dBFE2CF2304755A5E;
sub.f64 fd1354, fd1515, fd1514;
add.f64 fd1513, fd1001, fd1522;
mul.f64 fd1355, fd1522, 0d3FE9E3779B97F4A8;
sub.f64 fd1356, fd1001, fd1355;
fma.rn.f64 fd1357, fd1521, 0d3FD3C6EF372FE950, fd1356;
mul.f64 fd1358, fd1350, 0d3FE2CF2304755A5E;
mul.f64 fd1359, fd1352, 0d3FEE6F0E134454FF;
sub.f64 fd1360, fd1359, fd1358;
add.f64 fd1361, fd1221, fd1236;
add.f64 fd1363, fd1226, fd1231;
mul.f64 fd1368, fd1363, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1512, fd1361, 0d3FD3C6EF372FE950, fd984;
sub.f64 fd1369, fd1512, fd1368;
add.f64 fd1511, fd1223, fd1238;
sub.f64 fd1370, fd1223, fd1238;
add.f64 fd1510, fd1228, fd1233;
sub.f64 fd1372, fd1228, fd1233;
mul.f64 fd1508, fd1370, 0d3FEE6F0E134454FF;
mul.f64 fd1509, fd1372, 0dBFE2CF2304755A5E;
sub.f64 fd1374, fd1509, fd1508;
add.f64 fd1507, fd984, fd1361;
mul.f64 fd1375, fd1361, 0d3FE9E3779B97F4A8;
sub.f64 fd1376, fd984, fd1375;
fma.rn.f64 fd1377, fd1363, 0d3FD3C6EF372FE950, fd1376;
mul.f64 fd1378, fd1370, 0d3FE2CF2304755A5E;
mul.f64 fd1379, fd1372, 0d3FEE6F0E134454FF;
sub.f64 fd1380, fd1379, fd1378;
fma.rn.f64 fd1505, fd1511, 0d3FD3C6EF372FE950, fd1002;
mul.f64 fd1506, fd1510, 0d3FE9E3779B97F4A8;
sub.f64 fd1383, fd1505, fd1506;
sub.f64 fd1384, fd1221, fd1236;
sub.f64 fd1386, fd1226, fd1231;
mul.f64 fd1503, fd1384, 0d3FEE6F0E134454FF;
mul.f64 fd1504, fd1386, 0dBFE2CF2304755A5E;
sub.f64 fd1388, fd1504, fd1503;
add.f64 fd1502, fd1002, fd1511;
mul.f64 fd1389, fd1511, 0d3FE9E3779B97F4A8;
sub.f64 fd1390, fd1002, fd1389;
fma.rn.f64 fd1391, fd1510, 0d3FD3C6EF372FE950, fd1390;
mul.f64 fd1392, fd1384, 0d3FE2CF2304755A5E;
mul.f64 fd1393, fd1386, 0d3FEE6F0E134454FF;
sub.f64 fd1394, fd1393, fd1392;
add.f64 fd1395, fd1241, fd1256;
add.f64 fd1397, fd1246, fd1251;
mul.f64 fd1402, fd1397, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1501, fd1395, 0d3FD3C6EF372FE950, fd976;
sub.f64 fd1403, fd1501, fd1402;
add.f64 fd1500, fd1243, fd1258;
sub.f64 fd1404, fd1243, fd1258;
add.f64 fd1499, fd1248, fd1253;
sub.f64 fd1406, fd1248, fd1253;
mul.f64 fd1407, fd1406, 0dBFE2CF2304755A5E;
mul.f64 fd1498, fd1404, 0d3FEE6F0E134454FF;
sub.f64 fd1408, fd1407, fd1498;
add.f64 fd1497, fd976, fd1395;
mul.f64 fd1409, fd1395, 0d3FE9E3779B97F4A8;
sub.f64 fd1410, fd976, fd1409;
fma.rn.f64 fd1411, fd1397, 0d3FD3C6EF372FE950, fd1410;
mul.f64 fd1412, fd1404, 0d3FE2CF2304755A5E;
mul.f64 fd1413, fd1406, 0d3FEE6F0E134454FF;
sub.f64 fd1414, fd1413, fd1412;
mul.f64 fd1416, fd1499, 0d3FE9E3779B97F4A8;
fma.rn.f64 fd1496, fd1500, 0d3FD3C6EF372FE950, fd994;
sub.f64 fd1417, fd1496, fd1416;
sub.f64 fd1418, fd1241, fd1256;
sub.f64 fd1420, fd1246, fd1251;
mul.f64 fd1494, fd1418, 0d3FEE6F0E134454FF;
mul.f64 fd1495, fd1420, 0dBFE2CF2304755A5E;
sub.f64 fd1422, fd1495, fd1494;
add.f64 fd1493, fd994, fd1500;
mul.f64 fd1423, fd1500, 0d3FE9E3779B97F4A8;
sub.f64 fd1424, fd994, fd1423;
fma.rn.f64 fd1425, fd1499, 0d3FD3C6EF372FE950, fd1424;
mul.f64 fd1426, fd1418, 0d3FE2CF2304755A5E;
mul.f64 fd1427, fd1420, 0d3FEE6F0E134454FF;
sub.f64 fd1428, fd1427, fd1426;
add.f64 %1, fd1542, fd1534;
add.f64 %0, fd1261, fd1539;
add.f64 %3, fd1531, fd1525;
add.f64 %2, fd1295, fd1529;
add.f64 %5, fd1521, fd1513;
add.f64 %4, fd1329, fd1518;
add.f64 %7, fd1510, fd1502;
add.f64 %6, fd1363, fd1507;
add.f64 %9, fd1499, fd1493;
add.f64 %8, fd1397, fd1497;
sub.f64 %10, fd1267, fd1272;
add.f64 %11, fd1286, fd1281;
sub.f64 %12, fd1301, fd1306;
add.f64 %13, fd1320, fd1315;
sub.f64 %14, fd1335, fd1340;
add.f64 %15, fd1354, fd1349;
add.f64 %17, fd1388, fd1383;
sub.f64 %16, fd1369, fd1374;
add.f64 %19, fd1422, fd1417;
sub.f64 %18, fd1403, fd1408;
add.f64 %21, fd1292, fd1289;
sub.f64 %20, fd1275, fd1278;
sub.f64 %22, fd1309, fd1312;
add.f64 %23, fd1326, fd1323;
sub.f64 %24, fd1343, fd1346;
add.f64 %25, fd1360, fd1357;
sub.f64 %26, fd1377, fd1380;
add.f64 %27, fd1394, fd1391;
add.f64 %29, fd1428, fd1425;
sub.f64 %28, fd1411, fd1414;
sub.f64 %31, fd1289, fd1292;
add.f64 %30, fd1278, fd1275;
sub.f64 %33, fd1323, fd1326;
add.f64 %32, fd1312, fd1309;
sub.f64 %35, fd1357, fd1360;
add.f64 %34, fd1346, fd1343;
sub.f64 %37, fd1391, fd1394;
add.f64 %36, fd1380, fd1377;
sub.f64 %39, fd1425, fd1428;
add.f64 %38, fd1414, fd1411;
sub.f64 %41, fd1281, fd1286;
add.f64 %40, fd1272, fd1267;
sub.f64 %43, fd1315, fd1320;
add.f64 %42, fd1306, fd1301;
sub.f64 %45, fd1349, fd1354;
add.f64 %44, fd1340, fd1335;
sub.f64 %47, fd1383, fd1388;
add.f64 %46, fd1374, fd1369;
sub.f64 %49, fd1417, fd1422;
add.f64 %48, fd1408, fd1403;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y), "=d"(rmem[9].x), "=d"(rmem[9].y), "=d"(rmem[10].x), "=d"(rmem[10].y), "=d"(rmem[11].x), "=d"(rmem[11].y), "=d"(rmem[12].x), "=d"(rmem[12].y), "=d"(rmem[13].x), "=d"(rmem[13].y), "=d"(rmem[14].x), "=d"(rmem[14].y), "=d"(rmem[15].x), "=d"(rmem[15].y), "=d"(rmem[16].x), "=d"(rmem[16].y), "=d"(rmem[17].x), "=d"(rmem[17].y), "=d"(rmem[18].x), "=d"(rmem[18].y), "=d"(rmem[19].x), "=d"(rmem[19].y), "=d"(rmem[20].x), "=d"(rmem[20].y), "=d"(rmem[21].x), "=d"(rmem[21].y), "=d"(rmem[22].x), "=d"(rmem[22].y), "=d"(rmem[23].x), "=d"(rmem[23].y), "=d"(rmem[24].x), "=d"(rmem[24].y): "r"(smem), "l"(lut_dp_25_625), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y), "d"(rmem[9].x), "d"(rmem[9].y), "d"(rmem[10].x), "d"(rmem[10].y), "d"(rmem[11].x), "d"(rmem[11].y), "d"(rmem[12].x), "d"(rmem[12].y), "d"(rmem[13].x), "d"(rmem[13].y), "d"(rmem[14].x), "d"(rmem[14].y), "d"(rmem[15].x), "d"(rmem[15].y), "d"(rmem[16].x), "d"(rmem[16].y), "d"(rmem[17].x), "d"(rmem[17].y), "d"(rmem[18].x), "d"(rmem[18].y), "d"(rmem[19].x), "d"(rmem[19].y), "d"(rmem[20].x), "d"(rmem[20].y), "d"(rmem[21].x), "d"(rmem[21].y), "d"(rmem[22].x), "d"(rmem[22].y), "d"(rmem[23].x), "d"(rmem[23].y), "d"(rmem[24].x), "d"(rmem[24].y), "d"(rmem[5].y), "d"(rmem[10].y), "d"(rmem[20].y), "d"(rmem[16].y), "d"(rmem[1].y), "d"(rmem[11].y), "d"(rmem[2].y), "d"(rmem[22].y), "d"(rmem[7].y), "d"(rmem[17].y), "d"(rmem[23].y), "d"(rmem[8].y), "d"(rmem[13].y), "d"(rmem[19].y), "d"(rmem[4].y), 
"d"(rmem[14].y));
};




// cufftdx_private_function<541, double, 1>
//
// Machine-generated inline-PTX routine that transforms five complex<double>
// values held by each thread, exchanging intermediate data with other threads
// through shared memory.
//
// Parameters
//   rmem  Per-thread array. rmem[0]..rmem[4] are read as inputs and are
//         overwritten with the results (they are listed both as "=d" outputs
//         and as "d" inputs of the asm statement).
//   smem  32-bit value used as the base of every st.shared / ld.shared
//         address computed in the PTX.
//
// Structure of the PTX, in program order
//   1. A 5-input butterfly on rmem[0..4]. The four f64 literals evaluate to
//      about 0.309017, 0.809017, 0.951057 and 0.587785, i.e. cos(2*pi/5),
//      -cos(4*pi/5), sin(2*pi/5) and sin(4*pi/5).
//   2. Three rounds, each consisting of
//        a) complex multiplication of four of the five butterfly results by
//           factors derived from a lookup table (two factors are loaded with
//           ld.global.v2.f64, the other two are the square of the first and
//           the product of the two loaded ones),
//        b) an exchange through shared memory, done twice: first the real
//           parts, then the imaginary parts, reusing the same addresses
//           (hence four barrier.sync per round),
//        c) another 5-input butterfly on the five values read back.
//      With t = %tid.x % 125:
//        round 1: table %11 (lut_dp_5_625), entries t and t + 125;
//                 stores at byte offset t*40 + k*8
//        round 2: table %12 (lut_dp_5_125), entries t/5 and t/5 + 25;
//                 stores at byte offset (t/5)*200 + (t%5)*8 + k*40
//        round 3: table %13 (lut_dp_5_25), entries t/25 and t/25 + 5;
//                 stores at byte offset (t/25)*1000 + (t%25)*8 + k*200
//      In every round the loads come from byte offset t*8 + k*1000, k = 0..4.
//      The multiply/shift pairs (274877907 >> 35, 0xCCCCCCCD >> 34,
//      1374389535 >> 35) are unsigned divisions by 125, 5 and 25.
//   3. The results of the last butterfly are written to %0..%9.
//
// Shared-memory layout
//   All offsets above are relative to
//       smem + %tid.y * 5000 + (%tid.x / 125) * 5000
//   and the accesses of one thread group span 5000 bytes (625 doubles).
//   NOTE(review): %tid.y and %tid.x / 125 are scaled by the same 5000-byte
//   stride, so presumably at most one of them is nonzero in a given launch --
//   confirm against the caller.
//
// Usage notes
//   * The PTX contains twelve `barrier.sync 0` instructions; presumably every
//     thread of the block has to execute this function together -- confirm
//     against the caller.
//   * NOTE(review): the asm statement has no clobber list (no "memory"
//     clobber) although it reads and writes shared memory through addresses
//     derived from `smem`. Confirm that callers do not depend on the compiler
//     ordering their own shared-memory accesses around this call.
//   * Presumably this is the 5-elements-per-thread, 125-threads-per-transform
//     variant of a 625-point forward FFT (625 = 5^4, and the include guard is
//     CUFFTDX_FFT_625_FP64_FWD_PTX_HPP) -- TODO confirm with the generator.
template<> __forceinline__ __device__ void cufftdx_private_function<541, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

// The whole body is a single PTX program; operands are bound by the
// constraint list that follows the string literal.
asm volatile (R"({
.reg .b32 r<24>;
.reg .f64 fd<341>;
.reg .b64 rd<17>;
mov.u32 r1, %tid.y;
mov.u32 r2, %10;
mad.lo.s32 r3, r1, 5000, r2;
mov.u32 r4, %tid.x;
add.f64 fd21, %16, %24;
add.f64 fd22, %14, fd21;
add.f64 fd23, %19, %22;
add.f64 fd24, fd23, fd22;
add.f64 fd25, %18, %25;
add.f64 fd26, %15, fd25;
add.f64 fd27, %21, %23;
add.f64 fd28, fd27, fd26;
fma.rn.f64 fd29, fd21, 0d3FD3C6EF372FE950, %14;
mul.f64 fd30, fd23, 0d3FE9E3779B97F4A8;
sub.f64 fd31, fd29, fd30;
sub.f64 fd32, %18, %25;
mul.f64 fd33, fd32, 0d3FEE6F0E134454FF;
sub.f64 fd34, %21, %23;
mul.f64 fd35, fd34, 0dBFE2CF2304755A5E;
sub.f64 fd36, fd35, fd33;
sub.f64 fd37, fd31, fd36;
add.f64 fd38, fd36, fd31;
mul.f64 fd39, fd21, 0d3FE9E3779B97F4A8;
sub.f64 fd40, %14, fd39;
fma.rn.f64 fd41, fd23, 0d3FD3C6EF372FE950, fd40;
mul.f64 fd42, fd32, 0d3FE2CF2304755A5E;
mul.f64 fd43, fd34, 0d3FEE6F0E134454FF;
sub.f64 fd44, fd43, fd42;
sub.f64 fd45, fd41, fd44;
add.f64 fd46, fd44, fd41;
fma.rn.f64 fd47, fd25, 0d3FD3C6EF372FE950, %15;
mul.f64 fd48, fd27, 0d3FE9E3779B97F4A8;
sub.f64 fd49, fd47, fd48;
sub.f64 fd50, %16, %24;
mul.f64 fd51, fd50, 0d3FEE6F0E134454FF;
sub.f64 fd52, %19, %22;
mul.f64 fd53, fd52, 0dBFE2CF2304755A5E;
sub.f64 fd54, fd53, fd51;
add.f64 fd55, fd54, fd49;
sub.f64 fd56, fd49, fd54;
mul.f64 fd57, fd25, 0d3FE9E3779B97F4A8;
sub.f64 fd58, %15, fd57;
fma.rn.f64 fd59, fd27, 0d3FD3C6EF372FE950, fd58;
mul.f64 fd60, fd50, 0d3FE2CF2304755A5E;
mul.f64 fd61, fd52, 0d3FEE6F0E134454FF;
sub.f64 fd62, fd61, fd60;
add.f64 fd63, fd62, fd59;
sub.f64 fd64, fd59, fd62;
mul.wide.u32 rd2, r4, 274877907;
shr.u64 rd3, rd2, 35;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 125;
sub.s32 r7, r4, r6;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %11;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd65, fd66}, [rd6];
mul.f64 fd69, fd65, fd37;
mul.f64 fd70, fd66, fd55;
sub.f64 fd71, fd69, fd70;
mul.f64 fd72, fd65, fd55;
fma.rn.f64 fd73, fd66, fd37, fd72;
mul.f64 fd74, fd65, fd65;
mul.f64 fd75, fd66, fd66;
sub.f64 fd76, fd74, fd75;
mul.f64 fd77, fd66, fd65;
fma.rn.f64 fd78, fd66, fd65, fd77;
mul.f64 fd79, fd76, fd45;
mul.f64 fd80, fd78, fd63;
sub.f64 fd81, fd79, fd80;
mul.f64 fd82, fd76, fd63;
fma.rn.f64 fd83, fd78, fd45, fd82;
ld.global.v2.f64 {fd84, fd85}, [rd6+2000];
mul.f64 fd88, fd84, fd46;
mul.f64 fd89, fd85, fd64;
sub.f64 fd90, fd88, fd89;
mul.f64 fd91, fd84, fd64;
fma.rn.f64 fd92, fd85, fd46, fd91;
mul.f64 fd93, fd65, fd84;
mul.f64 fd94, fd66, fd85;
sub.f64 fd95, fd93, fd94;
mul.f64 fd96, fd65, fd85;
fma.rn.f64 fd97, fd66, fd84, fd96;
mul.f64 fd98, fd95, fd38;
mul.f64 fd99, fd97, fd56;
sub.f64 fd100, fd98, fd99;
mul.f64 fd101, fd95, fd56;
fma.rn.f64 fd102, fd97, fd38, fd101;
mad.lo.s32 r8, r5, 5000, r3;
barrier.sync 0;
mad.lo.s32 r9, r7, 40, r8;
st.shared.f64 [r9], fd24;
st.shared.f64 [r9+8], fd71;
st.shared.f64 [r9+16], fd81;
st.shared.f64 [r9+24], fd90;
st.shared.f64 [r9+32], fd100;
barrier.sync 0;
shl.b32 r10, r7, 5;
sub.s32 r11, r9, r10;
ld.shared.f64 fd103, [r11];
ld.shared.f64 fd104, [r11+1000];
ld.shared.f64 fd105, [r11+2000];
ld.shared.f64 fd106, [r11+3000];
ld.shared.f64 fd107, [r11+4000];
barrier.sync 0;
st.shared.f64 [r9], fd28;
st.shared.f64 [r9+8], fd73;
st.shared.f64 [r9+16], fd83;
st.shared.f64 [r9+24], fd92;
st.shared.f64 [r9+32], fd102;
barrier.sync 0;
ld.shared.f64 fd108, [r11];
ld.shared.f64 fd109, [r11+1000];
ld.shared.f64 fd110, [r11+2000];
ld.shared.f64 fd111, [r11+3000];
ld.shared.f64 fd112, [r11+4000];
add.f64 fd113, fd104, fd107;
add.f64 fd114, fd103, fd113;
add.f64 fd115, fd105, fd106;
add.f64 fd116, fd115, fd114;
add.f64 fd117, fd109, fd112;
add.f64 fd118, fd108, fd117;
add.f64 fd119, fd110, fd111;
add.f64 fd120, fd119, fd118;
fma.rn.f64 fd121, fd113, 0d3FD3C6EF372FE950, fd103;
mul.f64 fd122, fd115, 0d3FE9E3779B97F4A8;
sub.f64 fd123, fd121, fd122;
sub.f64 fd124, fd109, fd112;
mul.f64 fd125, fd124, 0d3FEE6F0E134454FF;
sub.f64 fd126, fd110, fd111;
mul.f64 fd127, fd126, 0dBFE2CF2304755A5E;
sub.f64 fd128, fd127, fd125;
sub.f64 fd129, fd123, fd128;
add.f64 fd130, fd128, fd123;
mul.f64 fd131, fd113, 0d3FE9E3779B97F4A8;
sub.f64 fd132, fd103, fd131;
fma.rn.f64 fd133, fd115, 0d3FD3C6EF372FE950, fd132;
mul.f64 fd134, fd124, 0d3FE2CF2304755A5E;
mul.f64 fd135, fd126, 0d3FEE6F0E134454FF;
sub.f64 fd136, fd135, fd134;
sub.f64 fd137, fd133, fd136;
add.f64 fd138, fd136, fd133;
fma.rn.f64 fd139, fd117, 0d3FD3C6EF372FE950, fd108;
mul.f64 fd140, fd119, 0d3FE9E3779B97F4A8;
sub.f64 fd141, fd139, fd140;
sub.f64 fd142, fd104, fd107;
mul.f64 fd143, fd142, 0d3FEE6F0E134454FF;
sub.f64 fd144, fd105, fd106;
mul.f64 fd145, fd144, 0dBFE2CF2304755A5E;
sub.f64 fd146, fd145, fd143;
add.f64 fd147, fd146, fd141;
sub.f64 fd148, fd141, fd146;
mul.f64 fd149, fd117, 0d3FE9E3779B97F4A8;
sub.f64 fd150, fd108, fd149;
fma.rn.f64 fd151, fd119, 0d3FD3C6EF372FE950, fd150;
mul.f64 fd152, fd142, 0d3FE2CF2304755A5E;
mul.f64 fd153, fd144, 0d3FEE6F0E134454FF;
sub.f64 fd154, fd153, fd152;
add.f64 fd155, fd154, fd151;
sub.f64 fd156, fd151, fd154;
mul.wide.u32 rd7, r7, -858993459;
shr.u64 rd8, rd7, 34;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 5;
sub.s32 r14, r7, r13;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %12;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd157, fd158}, [rd11];
mul.f64 fd161, fd157, fd129;
mul.f64 fd162, fd158, fd147;
sub.f64 fd163, fd161, fd162;
mul.f64 fd164, fd157, fd147;
fma.rn.f64 fd165, fd158, fd129, fd164;
mul.f64 fd166, fd157, fd157;
mul.f64 fd167, fd158, fd158;
sub.f64 fd168, fd166, fd167;
mul.f64 fd169, fd158, fd157;
fma.rn.f64 fd170, fd158, fd157, fd169;
mul.f64 fd171, fd168, fd137;
mul.f64 fd172, fd170, fd155;
sub.f64 fd173, fd171, fd172;
mul.f64 fd174, fd168, fd155;
fma.rn.f64 fd175, fd170, fd137, fd174;
ld.global.v2.f64 {fd176, fd177}, [rd11+400];
mul.f64 fd180, fd176, fd138;
mul.f64 fd181, fd177, fd156;
sub.f64 fd182, fd180, fd181;
mul.f64 fd183, fd176, fd156;
fma.rn.f64 fd184, fd177, fd138, fd183;
mul.f64 fd185, fd157, fd176;
mul.f64 fd186, fd158, fd177;
sub.f64 fd187, fd185, fd186;
mul.f64 fd188, fd157, fd177;
fma.rn.f64 fd189, fd158, fd176, fd188;
mul.f64 fd190, fd187, fd130;
mul.f64 fd191, fd189, fd148;
sub.f64 fd192, fd190, fd191;
mul.f64 fd193, fd187, fd148;
fma.rn.f64 fd194, fd189, fd130, fd193;
shl.b32 r15, r14, 3;
add.s32 r16, r8, r15;
barrier.sync 0;
mad.lo.s32 r17, r12, 200, r16;
st.shared.f64 [r17], fd116;
st.shared.f64 [r17+40], fd163;
st.shared.f64 [r17+80], fd173;
st.shared.f64 [r17+120], fd182;
st.shared.f64 [r17+160], fd192;
barrier.sync 0;
ld.shared.f64 fd195, [r11];
ld.shared.f64 fd196, [r11+1000];
ld.shared.f64 fd197, [r11+2000];
ld.shared.f64 fd198, [r11+3000];
ld.shared.f64 fd199, [r11+4000];
barrier.sync 0;
st.shared.f64 [r17], fd120;
st.shared.f64 [r17+40], fd165;
st.shared.f64 [r17+80], fd175;
st.shared.f64 [r17+120], fd184;
st.shared.f64 [r17+160], fd194;
barrier.sync 0;
ld.shared.f64 fd200, [r11];
ld.shared.f64 fd201, [r11+1000];
ld.shared.f64 fd202, [r11+2000];
ld.shared.f64 fd203, [r11+3000];
ld.shared.f64 fd204, [r11+4000];
add.f64 fd205, fd196, fd199;
add.f64 fd206, fd195, fd205;
add.f64 fd207, fd197, fd198;
add.f64 fd208, fd207, fd206;
add.f64 fd209, fd201, fd204;
add.f64 fd210, fd200, fd209;
add.f64 fd211, fd202, fd203;
add.f64 fd212, fd211, fd210;
fma.rn.f64 fd213, fd205, 0d3FD3C6EF372FE950, fd195;
mul.f64 fd214, fd207, 0d3FE9E3779B97F4A8;
sub.f64 fd215, fd213, fd214;
sub.f64 fd216, fd201, fd204;
mul.f64 fd217, fd216, 0d3FEE6F0E134454FF;
sub.f64 fd218, fd202, fd203;
mul.f64 fd219, fd218, 0dBFE2CF2304755A5E;
sub.f64 fd220, fd219, fd217;
sub.f64 fd221, fd215, fd220;
add.f64 fd222, fd220, fd215;
mul.f64 fd223, fd205, 0d3FE9E3779B97F4A8;
sub.f64 fd224, fd195, fd223;
fma.rn.f64 fd225, fd207, 0d3FD3C6EF372FE950, fd224;
mul.f64 fd226, fd216, 0d3FE2CF2304755A5E;
mul.f64 fd227, fd218, 0d3FEE6F0E134454FF;
sub.f64 fd228, fd227, fd226;
sub.f64 fd229, fd225, fd228;
add.f64 fd230, fd228, fd225;
fma.rn.f64 fd231, fd209, 0d3FD3C6EF372FE950, fd200;
mul.f64 fd232, fd211, 0d3FE9E3779B97F4A8;
sub.f64 fd233, fd231, fd232;
sub.f64 fd234, fd196, fd199;
mul.f64 fd235, fd234, 0d3FEE6F0E134454FF;
sub.f64 fd236, fd197, fd198;
mul.f64 fd237, fd236, 0dBFE2CF2304755A5E;
sub.f64 fd238, fd237, fd235;
add.f64 fd239, fd238, fd233;
sub.f64 fd240, fd233, fd238;
mul.f64 fd241, fd209, 0d3FE9E3779B97F4A8;
sub.f64 fd242, fd200, fd241;
fma.rn.f64 fd243, fd211, 0d3FD3C6EF372FE950, fd242;
mul.f64 fd244, fd234, 0d3FE2CF2304755A5E;
mul.f64 fd245, fd236, 0d3FEE6F0E134454FF;
sub.f64 fd246, fd245, fd244;
add.f64 fd247, fd246, fd243;
sub.f64 fd248, fd243, fd246;
mul.wide.u32 rd12, r7, 1374389535;
shr.u64 rd13, rd12, 35;
cvt.u32.u64 r18, rd13;
mul.lo.s32 r19, r18, 25;
sub.s32 r20, r7, r19;
mul.wide.u32 rd14, r18, 16;
mov.u64 rd15, %13;
add.s64 rd16, rd15, rd14;
ld.global.v2.f64 {fd249, fd250}, [rd16];
mul.f64 fd253, fd249, fd221;
mul.f64 fd254, fd250, fd239;
sub.f64 fd255, fd253, fd254;
mul.f64 fd256, fd249, fd239;
fma.rn.f64 fd257, fd250, fd221, fd256;
mul.f64 fd258, fd249, fd249;
mul.f64 fd259, fd250, fd250;
sub.f64 fd260, fd258, fd259;
mul.f64 fd261, fd250, fd249;
fma.rn.f64 fd262, fd250, fd249, fd261;
mul.f64 fd263, fd260, fd229;
mul.f64 fd264, fd262, fd247;
sub.f64 fd265, fd263, fd264;
mul.f64 fd266, fd260, fd247;
fma.rn.f64 fd267, fd262, fd229, fd266;
ld.global.v2.f64 {fd268, fd269}, [rd16+80];
mul.f64 fd272, fd268, fd230;
mul.f64 fd273, fd269, fd248;
sub.f64 fd274, fd272, fd273;
mul.f64 fd275, fd268, fd248;
fma.rn.f64 fd276, fd269, fd230, fd275;
mul.f64 fd277, fd249, fd268;
mul.f64 fd278, fd250, fd269;
sub.f64 fd279, fd277, fd278;
mul.f64 fd280, fd249, fd269;
fma.rn.f64 fd281, fd250, fd268, fd280;
mul.f64 fd282, fd279, fd222;
mul.f64 fd283, fd281, fd240;
sub.f64 fd284, fd282, fd283;
mul.f64 fd285, fd279, fd240;
fma.rn.f64 fd286, fd281, fd222, fd285;
shl.b32 r21, r20, 3;
add.s32 r22, r8, r21;
barrier.sync 0;
mad.lo.s32 r23, r18, 1000, r22;
st.shared.f64 [r23], fd208;
st.shared.f64 [r23+200], fd255;
st.shared.f64 [r23+400], fd265;
st.shared.f64 [r23+600], fd274;
st.shared.f64 [r23+800], fd284;
barrier.sync 0;
ld.shared.f64 fd287, [r11];
ld.shared.f64 fd288, [r11+1000];
ld.shared.f64 fd289, [r11+2000];
ld.shared.f64 fd290, [r11+3000];
ld.shared.f64 fd291, [r11+4000];
barrier.sync 0;
st.shared.f64 [r23], fd212;
st.shared.f64 [r23+200], fd257;
st.shared.f64 [r23+400], fd267;
st.shared.f64 [r23+600], fd276;
st.shared.f64 [r23+800], fd286;
barrier.sync 0;
ld.shared.f64 fd292, [r11];
ld.shared.f64 fd293, [r11+1000];
ld.shared.f64 fd294, [r11+2000];
ld.shared.f64 fd295, [r11+3000];
ld.shared.f64 fd296, [r11+4000];
add.f64 fd297, fd288, fd291;
add.f64 fd298, fd287, fd297;
add.f64 fd299, fd289, fd290;
add.f64 fd300, fd293, fd296;
add.f64 fd301, fd292, fd300;
add.f64 fd302, fd294, fd295;
fma.rn.f64 fd303, fd297, 0d3FD3C6EF372FE950, fd287;
mul.f64 fd304, fd299, 0d3FE9E3779B97F4A8;
sub.f64 fd305, fd303, fd304;
sub.f64 fd306, fd293, fd296;
mul.f64 fd307, fd306, 0d3FEE6F0E134454FF;
sub.f64 fd308, fd294, fd295;
mul.f64 fd309, fd308, 0dBFE2CF2304755A5E;
sub.f64 fd310, fd309, fd307;
mul.f64 fd311, fd297, 0d3FE9E3779B97F4A8;
sub.f64 fd312, fd287, fd311;
fma.rn.f64 fd313, fd299, 0d3FD3C6EF372FE950, fd312;
mul.f64 fd314, fd306, 0d3FE2CF2304755A5E;
mul.f64 fd315, fd308, 0d3FEE6F0E134454FF;
sub.f64 fd316, fd315, fd314;
fma.rn.f64 fd317, fd300, 0d3FD3C6EF372FE950, fd292;
mul.f64 fd318, fd302, 0d3FE9E3779B97F4A8;
sub.f64 fd319, fd317, fd318;
sub.f64 fd320, fd288, fd291;
mul.f64 fd321, fd320, 0d3FEE6F0E134454FF;
sub.f64 fd322, fd289, fd290;
mul.f64 fd323, fd322, 0dBFE2CF2304755A5E;
sub.f64 fd324, fd323, fd321;
mul.f64 fd325, fd300, 0d3FE9E3779B97F4A8;
sub.f64 fd326, fd292, fd325;
fma.rn.f64 fd327, fd302, 0d3FD3C6EF372FE950, fd326;
mul.f64 fd328, fd320, 0d3FE2CF2304755A5E;
mul.f64 fd329, fd322, 0d3FEE6F0E134454FF;
sub.f64 fd330, fd329, fd328;
add.f64 %0, fd299, fd298;
add.f64 %1, fd302, fd301;
add.f64 %3, fd324, fd319;
sub.f64 %2, fd305, fd310;
sub.f64 %4, fd313, fd316;
add.f64 %5, fd330, fd327;
add.f64 %6, fd316, fd313;
sub.f64 %7, fd327, fd330;
sub.f64 %9, fd319, fd324;
add.f64 %8, fd310, fd305;
})"
     // Operand map: %0-%9 = outputs rmem[0..4].{x,y}; %10 = smem;
     // %11-%13 = lut_dp_5_625, lut_dp_5_125, lut_dp_5_25;
     // %14-%25 = inputs rmem[0..4].{x,y}, where rmem[1].y and rmem[2].y are
     // each listed twice (%17/%18 and %20/%21). The PTX reads %18 and %21 and
     // never references %17 or %20.
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y): "r"(smem), "l"(lut_dp_5_625), "l"(lut_dp_5_125), "l"(lut_dp_5_25), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y));
};




// cufftdx_private_function<542, double, 1>
//
// Machine-generated inline-PTX routine that transforms five complex<double>
// values held by each thread, exchanging intermediate data with other threads
// through shared memory as 16-byte (real, imaginary) pairs.
//
// Parameters
//   rmem  Per-thread array. rmem[0]..rmem[4] are read as inputs and are
//         overwritten with the results (they are listed both as "=d" outputs
//         and as "d" inputs of the asm statement).
//   smem  32-bit value used as the base of every st.shared / ld.shared
//         address computed in the PTX.
//
// Structure of the PTX, in program order
//   1. A 5-input butterfly on rmem[0..4]. The four f64 literals evaluate to
//      about 0.309017, 0.809017, 0.951057 and 0.587785, i.e. cos(2*pi/5),
//      -cos(4*pi/5), sin(2*pi/5) and sin(4*pi/5).
//   2. Three rounds, each consisting of
//        a) complex multiplication of four of the five butterfly results by
//           factors derived from a lookup table (two factors are loaded with
//           ld.global.v2.f64, the other two are the square of the first and
//           the product of the two loaded ones),
//        b) one exchange through shared memory using st.shared.v2.f64 /
//           ld.shared.v2.f64, bracketed by two barrier.sync,
//        c) another 5-input butterfly on the five values read back.
//      With t = %tid.x % 125:
//        round 1: table %11 (lut_dp_5_625), entries t and t + 125;
//                 stores at byte offset t*80 + k*16
//        round 2: table %12 (lut_dp_5_125), entries t/5 and t/5 + 25;
//                 stores at byte offset (t/5)*400 + (t%5)*16 + k*80
//        round 3: table %13 (lut_dp_5_25), entries t/25 and t/25 + 5;
//                 stores at byte offset (t/25)*2000 + (t%25)*16 + k*400
//      In every round the loads come from byte offset t*16 + k*2000, k = 0..4.
//      The multiply/shift pairs (274877907 >> 35, 0xCCCCCCCD >> 34,
//      1374389535 >> 35) are unsigned divisions by 125, 5 and 25.
//   3. The results of the last butterfly are written to %0..%9.
//
// Shared-memory layout
//   All offsets above are relative to
//       smem + %tid.y * 10000 + (%tid.x / 125) * 10000
//   and the accesses of one thread group span 10000 bytes (625 pairs of
//   doubles).
//   NOTE(review): %tid.y and %tid.x / 125 are scaled by the same 10000-byte
//   stride, so presumably at most one of them is nonzero in a given launch --
//   confirm against the caller.
//   NOTE(review): the v2.f64 shared accesses move 16 bytes at a time, so
//   `smem` is presumably 16-byte aligned -- confirm against the caller.
//
// Usage notes
//   * The PTX contains six `barrier.sync 0` instructions; presumably every
//     thread of the block has to execute this function together -- confirm
//     against the caller.
//   * NOTE(review): the asm statement has no clobber list (no "memory"
//     clobber) although it reads and writes shared memory through addresses
//     derived from `smem`. Confirm that callers do not depend on the compiler
//     ordering their own shared-memory accesses around this call.
//   * Presumably this is the 5-elements-per-thread, 125-threads-per-transform
//     variant of a 625-point forward FFT (625 = 5^4, and the include guard is
//     CUFFTDX_FFT_625_FP64_FWD_PTX_HPP) -- TODO confirm with the generator.
template<> __forceinline__ __device__ void cufftdx_private_function<542, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

// The whole body is a single PTX program; operands are bound by the
// constraint list that follows the string literal.
asm volatile (R"({
.reg .b32 r<24>;
.reg .f64 fd<371>;
.reg .b64 rd<17>;
mov.u32 r1, %tid.y;
mov.u32 r2, %10;
mad.lo.s32 r3, r1, 10000, r2;
mov.u32 r4, %tid.x;
add.f64 fd21, %16, %24;
add.f64 fd22, %14, fd21;
add.f64 fd23, %19, %22;
add.f64 fd24, %18, %25;
add.f64 fd25, %15, fd24;
add.f64 fd26, %21, %23;
fma.rn.f64 fd27, fd21, 0d3FD3C6EF372FE950, %14;
mul.f64 fd28, fd23, 0d3FE9E3779B97F4A8;
sub.f64 fd29, fd27, fd28;
sub.f64 fd30, %18, %25;
mul.f64 fd31, fd30, 0d3FEE6F0E134454FF;
sub.f64 fd32, %21, %23;
mul.f64 fd33, fd32, 0dBFE2CF2304755A5E;
sub.f64 fd34, fd33, fd31;
sub.f64 fd35, fd29, fd34;
add.f64 fd36, fd34, fd29;
mul.f64 fd37, fd21, 0d3FE9E3779B97F4A8;
sub.f64 fd38, %14, fd37;
fma.rn.f64 fd39, fd23, 0d3FD3C6EF372FE950, fd38;
mul.f64 fd40, fd30, 0d3FE2CF2304755A5E;
mul.f64 fd41, fd32, 0d3FEE6F0E134454FF;
sub.f64 fd42, fd41, fd40;
sub.f64 fd43, fd39, fd42;
add.f64 fd44, fd42, fd39;
fma.rn.f64 fd45, fd24, 0d3FD3C6EF372FE950, %15;
mul.f64 fd46, fd26, 0d3FE9E3779B97F4A8;
sub.f64 fd47, fd45, fd46;
sub.f64 fd48, %16, %24;
mul.f64 fd49, fd48, 0d3FEE6F0E134454FF;
sub.f64 fd50, %19, %22;
mul.f64 fd51, fd50, 0dBFE2CF2304755A5E;
sub.f64 fd52, fd51, fd49;
add.f64 fd53, fd52, fd47;
sub.f64 fd54, fd47, fd52;
mul.f64 fd55, fd24, 0d3FE9E3779B97F4A8;
sub.f64 fd56, %15, fd55;
fma.rn.f64 fd57, fd26, 0d3FD3C6EF372FE950, fd56;
mul.f64 fd58, fd48, 0d3FE2CF2304755A5E;
mul.f64 fd59, fd50, 0d3FEE6F0E134454FF;
sub.f64 fd60, fd59, fd58;
add.f64 fd61, fd60, fd57;
sub.f64 fd62, fd57, fd60;
mul.wide.u32 rd2, r4, 274877907;
shr.u64 rd3, rd2, 35;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 125;
sub.s32 r7, r4, r6;
mad.lo.s32 r8, r5, 10000, r3;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %11;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd63, fd64}, [rd6];
mul.f64 fd67, fd63, fd35;
mul.f64 fd68, fd64, fd53;
mul.f64 fd69, fd63, fd53;
mul.f64 fd70, fd63, fd63;
mul.f64 fd71, fd64, fd64;
sub.f64 fd72, fd70, fd71;
mul.f64 fd73, fd64, fd63;
fma.rn.f64 fd74, fd64, fd63, fd73;
mul.f64 fd75, fd72, fd43;
mul.f64 fd76, fd74, fd61;
mul.f64 fd77, fd72, fd61;
ld.global.v2.f64 {fd78, fd79}, [rd6+2000];
mul.f64 fd82, fd78, fd44;
mul.f64 fd83, fd79, fd62;
mul.f64 fd84, fd78, fd62;
mul.f64 fd85, fd63, fd78;
mul.f64 fd86, fd64, fd79;
sub.f64 fd87, fd85, fd86;
mul.f64 fd88, fd63, fd79;
fma.rn.f64 fd89, fd64, fd78, fd88;
mul.f64 fd90, fd87, fd36;
mul.f64 fd91, fd89, fd54;
mul.f64 fd92, fd87, fd54;
barrier.sync 0;
mad.lo.s32 r9, r7, 80, r8;
add.f64 fd93, fd26, fd25;
add.f64 fd94, fd23, fd22;
st.shared.v2.f64 [r9], {fd94, fd93};
fma.rn.f64 fd95, fd64, fd35, fd69;
sub.f64 fd96, fd67, fd68;
st.shared.v2.f64 [r9+16], {fd96, fd95};
fma.rn.f64 fd97, fd74, fd43, fd77;
sub.f64 fd98, fd75, fd76;
st.shared.v2.f64 [r9+32], {fd98, fd97};
fma.rn.f64 fd99, fd79, fd44, fd84;
sub.f64 fd100, fd82, fd83;
st.shared.v2.f64 [r9+48], {fd100, fd99};
fma.rn.f64 fd101, fd89, fd36, fd92;
sub.f64 fd102, fd90, fd91;
st.shared.v2.f64 [r9+64], {fd102, fd101};
barrier.sync 0;
shl.b32 r10, r7, 6;
sub.s32 r11, r9, r10;
ld.shared.v2.f64 {fd103, fd104}, [r11];
ld.shared.v2.f64 {fd107, fd108}, [r11+2000];
ld.shared.v2.f64 {fd111, fd112}, [r11+4000];
ld.shared.v2.f64 {fd115, fd116}, [r11+6000];
ld.shared.v2.f64 {fd119, fd120}, [r11+8000];
add.f64 fd123, fd107, fd119;
add.f64 fd124, fd103, fd123;
add.f64 fd125, fd111, fd115;
add.f64 fd126, fd108, fd120;
add.f64 fd127, fd104, fd126;
add.f64 fd128, fd112, fd116;
fma.rn.f64 fd129, fd123, 0d3FD3C6EF372FE950, fd103;
mul.f64 fd130, fd125, 0d3FE9E3779B97F4A8;
sub.f64 fd131, fd129, fd130;
sub.f64 fd132, fd108, fd120;
mul.f64 fd133, fd132, 0d3FEE6F0E134454FF;
sub.f64 fd134, fd112, fd116;
mul.f64 fd135, fd134, 0dBFE2CF2304755A5E;
sub.f64 fd136, fd135, fd133;
sub.f64 fd137, fd131, fd136;
add.f64 fd138, fd136, fd131;
mul.f64 fd139, fd123, 0d3FE9E3779B97F4A8;
sub.f64 fd140, fd103, fd139;
fma.rn.f64 fd141, fd125, 0d3FD3C6EF372FE950, fd140;
mul.f64 fd142, fd132, 0d3FE2CF2304755A5E;
mul.f64 fd143, fd134, 0d3FEE6F0E134454FF;
sub.f64 fd144, fd143, fd142;
sub.f64 fd145, fd141, fd144;
add.f64 fd146, fd144, fd141;
fma.rn.f64 fd147, fd126, 0d3FD3C6EF372FE950, fd104;
mul.f64 fd148, fd128, 0d3FE9E3779B97F4A8;
sub.f64 fd149, fd147, fd148;
sub.f64 fd150, fd107, fd119;
mul.f64 fd151, fd150, 0d3FEE6F0E134454FF;
sub.f64 fd152, fd111, fd115;
mul.f64 fd153, fd152, 0dBFE2CF2304755A5E;
sub.f64 fd154, fd153, fd151;
add.f64 fd155, fd154, fd149;
sub.f64 fd156, fd149, fd154;
mul.f64 fd157, fd126, 0d3FE9E3779B97F4A8;
sub.f64 fd158, fd104, fd157;
fma.rn.f64 fd159, fd128, 0d3FD3C6EF372FE950, fd158;
mul.f64 fd160, fd150, 0d3FE2CF2304755A5E;
mul.f64 fd161, fd152, 0d3FEE6F0E134454FF;
sub.f64 fd162, fd161, fd160;
add.f64 fd163, fd162, fd159;
sub.f64 fd164, fd159, fd162;
mul.wide.u32 rd7, r7, -858993459;
shr.u64 rd8, rd7, 34;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 5;
sub.s32 r14, r7, r13;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %12;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd165, fd166}, [rd11];
mul.f64 fd169, fd165, fd137;
mul.f64 fd170, fd166, fd155;
mul.f64 fd171, fd165, fd155;
mul.f64 fd172, fd165, fd165;
mul.f64 fd173, fd166, fd166;
sub.f64 fd174, fd172, fd173;
mul.f64 fd175, fd166, fd165;
fma.rn.f64 fd176, fd166, fd165, fd175;
mul.f64 fd177, fd174, fd145;
mul.f64 fd178, fd176, fd163;
mul.f64 fd179, fd174, fd163;
ld.global.v2.f64 {fd180, fd181}, [rd11+400];
mul.f64 fd184, fd180, fd146;
mul.f64 fd185, fd181, fd164;
mul.f64 fd186, fd180, fd164;
mul.f64 fd187, fd165, fd180;
mul.f64 fd188, fd166, fd181;
sub.f64 fd189, fd187, fd188;
mul.f64 fd190, fd165, fd181;
fma.rn.f64 fd191, fd166, fd180, fd190;
mul.f64 fd192, fd189, fd138;
mul.f64 fd193, fd191, fd156;
mul.f64 fd194, fd189, fd156;
shl.b32 r15, r14, 4;
add.s32 r16, r8, r15;
barrier.sync 0;
mad.lo.s32 r17, r12, 400, r16;
add.f64 fd195, fd128, fd127;
add.f64 fd196, fd125, fd124;
st.shared.v2.f64 [r17], {fd196, fd195};
fma.rn.f64 fd197, fd166, fd137, fd171;
sub.f64 fd198, fd169, fd170;
st.shared.v2.f64 [r17+80], {fd198, fd197};
fma.rn.f64 fd199, fd176, fd145, fd179;
sub.f64 fd200, fd177, fd178;
st.shared.v2.f64 [r17+160], {fd200, fd199};
fma.rn.f64 fd201, fd181, fd146, fd186;
sub.f64 fd202, fd184, fd185;
st.shared.v2.f64 [r17+240], {fd202, fd201};
fma.rn.f64 fd203, fd191, fd138, fd194;
sub.f64 fd204, fd192, fd193;
st.shared.v2.f64 [r17+320], {fd204, fd203};
barrier.sync 0;
ld.shared.v2.f64 {fd205, fd206}, [r11];
ld.shared.v2.f64 {fd209, fd210}, [r11+2000];
ld.shared.v2.f64 {fd213, fd214}, [r11+4000];
ld.shared.v2.f64 {fd217, fd218}, [r11+6000];
ld.shared.v2.f64 {fd221, fd222}, [r11+8000];
add.f64 fd225, fd209, fd221;
add.f64 fd226, fd205, fd225;
add.f64 fd227, fd213, fd217;
add.f64 fd228, fd210, fd222;
add.f64 fd229, fd206, fd228;
add.f64 fd230, fd214, fd218;
fma.rn.f64 fd231, fd225, 0d3FD3C6EF372FE950, fd205;
mul.f64 fd232, fd227, 0d3FE9E3779B97F4A8;
sub.f64 fd233, fd231, fd232;
sub.f64 fd234, fd210, fd222;
mul.f64 fd235, fd234, 0d3FEE6F0E134454FF;
sub.f64 fd236, fd214, fd218;
mul.f64 fd237, fd236, 0dBFE2CF2304755A5E;
sub.f64 fd238, fd237, fd235;
sub.f64 fd239, fd233, fd238;
add.f64 fd240, fd238, fd233;
mul.f64 fd241, fd225, 0d3FE9E3779B97F4A8;
sub.f64 fd242, fd205, fd241;
fma.rn.f64 fd243, fd227, 0d3FD3C6EF372FE950, fd242;
mul.f64 fd244, fd234, 0d3FE2CF2304755A5E;
mul.f64 fd245, fd236, 0d3FEE6F0E134454FF;
sub.f64 fd246, fd245, fd244;
sub.f64 fd247, fd243, fd246;
add.f64 fd248, fd246, fd243;
fma.rn.f64 fd249, fd228, 0d3FD3C6EF372FE950, fd206;
mul.f64 fd250, fd230, 0d3FE9E3779B97F4A8;
sub.f64 fd251, fd249, fd250;
sub.f64 fd252, fd209, fd221;
mul.f64 fd253, fd252, 0d3FEE6F0E134454FF;
sub.f64 fd254, fd213, fd217;
mul.f64 fd255, fd254, 0dBFE2CF2304755A5E;
sub.f64 fd256, fd255, fd253;
add.f64 fd257, fd256, fd251;
sub.f64 fd258, fd251, fd256;
mul.f64 fd259, fd228, 0d3FE9E3779B97F4A8;
sub.f64 fd260, fd206, fd259;
fma.rn.f64 fd261, fd230, 0d3FD3C6EF372FE950, fd260;
mul.f64 fd262, fd252, 0d3FE2CF2304755A5E;
mul.f64 fd263, fd254, 0d3FEE6F0E134454FF;
sub.f64 fd264, fd263, fd262;
add.f64 fd265, fd264, fd261;
sub.f64 fd266, fd261, fd264;
mul.wide.u32 rd12, r7, 1374389535;
shr.u64 rd13, rd12, 35;
cvt.u32.u64 r18, rd13;
mul.lo.s32 r19, r18, 25;
sub.s32 r20, r7, r19;
mul.wide.u32 rd14, r18, 16;
mov.u64 rd15, %13;
add.s64 rd16, rd15, rd14;
ld.global.v2.f64 {fd267, fd268}, [rd16];
mul.f64 fd271, fd267, fd239;
mul.f64 fd272, fd268, fd257;
mul.f64 fd273, fd267, fd257;
mul.f64 fd274, fd267, fd267;
mul.f64 fd275, fd268, fd268;
sub.f64 fd276, fd274, fd275;
mul.f64 fd277, fd268, fd267;
fma.rn.f64 fd278, fd268, fd267, fd277;
mul.f64 fd279, fd276, fd247;
mul.f64 fd280, fd278, fd265;
mul.f64 fd281, fd276, fd265;
ld.global.v2.f64 {fd282, fd283}, [rd16+80];
mul.f64 fd286, fd282, fd248;
mul.f64 fd287, fd283, fd266;
mul.f64 fd288, fd282, fd266;
mul.f64 fd289, fd267, fd282;
mul.f64 fd290, fd268, fd283;
sub.f64 fd291, fd289, fd290;
mul.f64 fd292, fd267, fd283;
fma.rn.f64 fd293, fd268, fd282, fd292;
mul.f64 fd294, fd291, fd240;
mul.f64 fd295, fd293, fd258;
mul.f64 fd296, fd291, fd258;
shl.b32 r21, r20, 4;
add.s32 r22, r8, r21;
barrier.sync 0;
mad.lo.s32 r23, r18, 2000, r22;
add.f64 fd297, fd230, fd229;
add.f64 fd298, fd227, fd226;
st.shared.v2.f64 [r23], {fd298, fd297};
fma.rn.f64 fd299, fd268, fd239, fd273;
sub.f64 fd300, fd271, fd272;
st.shared.v2.f64 [r23+400], {fd300, fd299};
fma.rn.f64 fd301, fd278, fd247, fd281;
sub.f64 fd302, fd279, fd280;
st.shared.v2.f64 [r23+800], {fd302, fd301};
fma.rn.f64 fd303, fd283, fd248, fd288;
sub.f64 fd304, fd286, fd287;
st.shared.v2.f64 [r23+1200], {fd304, fd303};
fma.rn.f64 fd305, fd293, fd240, fd296;
sub.f64 fd306, fd294, fd295;
st.shared.v2.f64 [r23+1600], {fd306, fd305};
barrier.sync 0;
ld.shared.v2.f64 {fd307, fd308}, [r11];
ld.shared.v2.f64 {fd311, fd312}, [r11+2000];
ld.shared.v2.f64 {fd315, fd316}, [r11+4000];
ld.shared.v2.f64 {fd319, fd320}, [r11+6000];
ld.shared.v2.f64 {fd323, fd324}, [r11+8000];
add.f64 fd327, fd311, fd323;
add.f64 fd328, fd307, fd327;
add.f64 fd329, fd315, fd319;
add.f64 fd330, fd312, fd324;
add.f64 fd331, fd308, fd330;
add.f64 fd332, fd316, fd320;
fma.rn.f64 fd333, fd327, 0d3FD3C6EF372FE950, fd307;
mul.f64 fd334, fd329, 0d3FE9E3779B97F4A8;
sub.f64 fd335, fd333, fd334;
sub.f64 fd336, fd312, fd324;
mul.f64 fd337, fd336, 0d3FEE6F0E134454FF;
sub.f64 fd338, fd316, fd320;
mul.f64 fd339, fd338, 0dBFE2CF2304755A5E;
sub.f64 fd340, fd339, fd337;
mul.f64 fd341, fd327, 0d3FE9E3779B97F4A8;
sub.f64 fd342, fd307, fd341;
fma.rn.f64 fd343, fd329, 0d3FD3C6EF372FE950, fd342;
mul.f64 fd344, fd336, 0d3FE2CF2304755A5E;
mul.f64 fd345, fd338, 0d3FEE6F0E134454FF;
sub.f64 fd346, fd345, fd344;
fma.rn.f64 fd347, fd330, 0d3FD3C6EF372FE950, fd308;
mul.f64 fd348, fd332, 0d3FE9E3779B97F4A8;
sub.f64 fd349, fd347, fd348;
sub.f64 fd350, fd311, fd323;
mul.f64 fd351, fd350, 0d3FEE6F0E134454FF;
sub.f64 fd352, fd315, fd319;
mul.f64 fd353, fd352, 0dBFE2CF2304755A5E;
sub.f64 fd354, fd353, fd351;
mul.f64 fd355, fd330, 0d3FE9E3779B97F4A8;
sub.f64 fd356, fd308, fd355;
fma.rn.f64 fd357, fd332, 0d3FD3C6EF372FE950, fd356;
mul.f64 fd358, fd350, 0d3FE2CF2304755A5E;
mul.f64 fd359, fd352, 0d3FEE6F0E134454FF;
sub.f64 fd360, fd359, fd358;
add.f64 %1, fd332, fd331;
add.f64 %0, fd329, fd328;
add.f64 %3, fd354, fd349;
sub.f64 %2, fd335, fd340;
add.f64 %5, fd360, fd357;
sub.f64 %4, fd343, fd346;
sub.f64 %7, fd357, fd360;
add.f64 %6, fd346, fd343;
sub.f64 %9, fd349, fd354;
add.f64 %8, fd340, fd335;
})"
     // Operand map: %0-%9 = outputs rmem[0..4].{x,y}; %10 = smem;
     // %11-%13 = lut_dp_5_625, lut_dp_5_125, lut_dp_5_25;
     // %14-%25 = inputs rmem[0..4].{x,y}, where rmem[1].y and rmem[2].y are
     // each listed twice (%17/%18 and %20/%21). The PTX reads %18 and %21 and
     // never references %17 or %20.
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y): "r"(smem), "l"(lut_dp_5_625), "l"(lut_dp_5_125), "l"(lut_dp_5_25), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y));
};


#endif
